[["Random", "mmlu-pro_all", 10, 10, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.2, 0.4, 0.1, 0.2, 0.4]], ["Random", "mmlu-pro_all", 10, 10, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.5, 0.4, 0.4, 0.5]], ["Random", "mmlu-pro_all", 10, 10, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.2, 0.3, 0.3, 0.3, 0.4]], ["Random", "mmlu-pro_all", 10, 10, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.3, 0.3, 0.3, 0.4]], ["Random", "mmlu-pro_all", 10, 10, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.6, 0.4, 0.6, 0.5]], ["Random", "mmlu-pro_all", 10, 10, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.4, 0.5, 0.2, 0.5]], ["Random", "mmlu-pro_all", 10, 10, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.5, 0.6, 0.3, 0.5, 0.7]], ["Random", "mmlu-pro_all", 10, 10, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.6, 0.6, 0.4, 0.5, 0.4]], ["Random", "mmlu-pro_all", 10, 10, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.2, 0.3, 0.2, 0.3, 0.3]], ["Random", "mmlu-pro_all", 10, 10, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.5, 0.5, 0.3, 0.5, 0.2]], ["Random", "mmlu-pro_all", 25, 25, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.48, 0.52, 0.28, 0.52, 0.44]], ["Random", "mmlu-pro_all", 25, 25, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.56, 0.52, 0.36, 0.64, 0.52]], ["Random", "mmlu-pro_all", 25, 25, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.2, 0.36, 0.4, 0.44, 0.24]], ["Random", "mmlu-pro_all", 25, 25, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.48, 0.24, 0.44, 0.48]], ["Random", "mmlu-pro_all", 25, 25, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.44, 0.6, 0.52, 0.56, 0.64]], ["Random", "mmlu-pro_all", 25, 25, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.44, 0.28, 0.64, 0.28, 0.4]], ["Random", "mmlu-pro_all", 25, 25, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.52, 0.44, 0.6, 0.44]], ["Random", "mmlu-pro_all", 25, 25, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.36, 0.52, 0.44, 0.52, 0.48]], ["Random", "mmlu-pro_all", 25, 25, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.48, 0.44, 0.24, 0.36, 0.52]], ["Random", "mmlu-pro_all", 25, 25, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.44, 0.2, 0.44, 0.44]], ["Random", "mmlu-pro_all", 50, 50, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.32, 0.48, 0.36, 0.48, 0.4]], ["Random", "mmlu-pro_all", 50, 50, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.44, 0.54, 0.42, 0.5, 0.54]], ["Random", "mmlu-pro_all", 50, 50, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.34, 0.46, 0.34, 0.46, 0.36]], ["Random", "mmlu-pro_all", 50, 50, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.52, 0.4, 0.56, 0.52]], ["Random", "mmlu-pro_all", 50, 50, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.54, 0.52, 0.5, 0.48, 0.54]], ["Random", "mmlu-pro_all", 50, 50, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.46, 0.52, 0.42, 0.6, 0.52]], ["Random", "mmlu-pro_all", 50, 50, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.34, 0.46, 0.42, 0.42, 0.4]], ["Random", "mmlu-pro_all", 50, 50, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.38, 0.46, 0.48, 0.48]], ["Random", "mmlu-pro_all", 50, 50, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.36, 0.38, 0.28, 0.32, 0.4]], ["Random", "mmlu-pro_all", 50, 50, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.42, 0.28, 0.38, 0.48]], ["Random", "mmlu-pro_all", 100, 100, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41, 0.45, 0.32, 0.4, 0.47]], ["Random", "mmlu-pro_all", 100, 100, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.44, 0.49, 0.41, 0.47, 0.44]], ["Random", "mmlu-pro_all", 100, 100, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.47, 0.47, 0.37, 0.48, 0.47]], ["Random", "mmlu-pro_all", 100, 100, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.44, 0.38, 0.48, 0.42]], ["Random", "mmlu-pro_all", 100, 100, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41, 0.43, 0.34, 0.43, 0.44]], ["Random", "mmlu-pro_all", 100, 100, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.37, 0.4, 0.33, 0.43, 0.5]], ["Random", "mmlu-pro_all", 100, 100, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.37, 0.4, 0.41, 0.42, 0.46]], ["Random", "mmlu-pro_all", 100, 100, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.45, 0.53, 0.44, 0.53, 0.51]], ["Random", "mmlu-pro_all", 100, 100, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.47, 0.49, 0.41, 0.51, 0.48]], ["Random", "mmlu-pro_all", 100, 100, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.44, 0.42, 0.4, 0.42, 0.4]], ["Random", "mmlu-pro_all", 250, 250, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.364, 0.388, 0.34, 0.428, 0.424]], ["Random", "mmlu-pro_all", 250, 250, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.412, 0.532, 0.336, 0.528, 0.5]], ["Random", "mmlu-pro_all", 250, 250, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.388, 0.484, 0.328, 0.468, 0.456]], ["Random", "mmlu-pro_all", 250, 250, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.424, 0.492, 0.332, 0.476, 0.512]], ["Random", "mmlu-pro_all", 250, 250, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.436, 0.468, 0.408, 0.484, 0.472]], ["Random", "mmlu-pro_all", 250, 250, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.416, 0.444, 0.352, 0.464, 0.476]], ["Random", "mmlu-pro_all", 250, 250, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4, 0.396, 0.344, 0.428, 0.432]], ["Random", "mmlu-pro_all", 250, 250, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.396, 0.444, 0.34, 0.468, 0.464]], ["Random", "mmlu-pro_all", 250, 250, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.36, 0.416, 0.364, 0.4, 0.424]], ["Random", "mmlu-pro_all", 250, 250, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.404, 0.44, 0.368, 0.48, 0.444]], ["Random", "mmlu-pro_all", 500, 500, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.458, 0.492, 0.426, 0.512, 0.498]], ["Random", "mmlu-pro_all", 500, 500, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.454, 0.548, 0.362, 0.538, 0.524]], ["Random", "mmlu-pro_all", 500, 500, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.426, 0.504, 0.36, 0.5, 0.49]], ["Random", "mmlu-pro_all", 500, 500, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.406, 0.472, 0.376, 0.466, 0.468]], ["Random", "mmlu-pro_all", 500, 500, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.43, 0.488, 0.396, 0.482, 0.508]], ["Random", "mmlu-pro_all", 500, 500, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.406, 0.466, 0.356, 0.488, 0.444]], ["Random", "mmlu-pro_all", 500, 500, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.434, 0.476, 0.378, 0.472, 0.468]], ["Random", "mmlu-pro_all", 500, 500, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.406, 0.462, 0.366, 0.478, 0.492]], ["Random", "mmlu-pro_all", 500, 500, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.418, 0.48, 0.348, 0.48, 0.476]], ["Random", "mmlu-pro_all", 500, 500, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.436, 0.468, 0.402, 0.48, 0.49]], ["Random", "mmlu-pro_all", 1000, 1000, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.408, 0.435, 0.356, 0.478, 0.445]], ["Random", "mmlu-pro_all", 1000, 1000, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.438, 0.504, 0.38, 0.51, 0.489]], ["Random", "mmlu-pro_all", 1000, 1000, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.406, 0.472, 0.371, 0.471, 0.468]], ["Random", "mmlu-pro_all", 1000, 1000, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.384, 0.443, 0.361, 0.458, 0.465]], ["Random", "mmlu-pro_all", 1000, 1000, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.409, 0.477, 0.382, 0.473, 0.475]], ["Random", "mmlu-pro_all", 1000, 1000, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.401, 0.445, 0.375, 0.471, 0.466]], ["Random", "mmlu-pro_all", 1000, 1000, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.417, 0.44, 0.359, 0.454, 0.448]], ["Random", "mmlu-pro_all", 1000, 1000, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.407, 0.458, 0.369, 0.463, 0.465]], ["Random", "mmlu-pro_all", 1000, 1000, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.405, 0.472, 0.361, 0.469, 0.474]], ["Random", "mmlu-pro_all", 1000, 1000, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.431, 0.469, 0.381, 0.469, 0.473]], ["Anchor_Points_Weighted", "mmlu-pro_all", 10, 10, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41672824591119584, 0.3984263680917083, 0.3325860549167118, 0.4236018853319639, 0.4791697107270968]], ["Anchor_Points_Weighted", "mmlu-pro_all", 10, 10, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4995512661300312, 0.5680650890412339, 0.5074916514126601, 0.6272060940587765, 0.5585245040036765]], ["Anchor_Points_Weighted", "mmlu-pro_all", 10, 10, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.32384613725006917, 0.5453870242900476, 0.28413638700479477, 0.5585155076924931, 0.643590575217504]], ["Anchor_Points_Weighted", "mmlu-pro_all", 10, 10, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.5511930101475515, 0.6053304410194438, 0.42151290871549485, 0.6260233914364387, 0.6959020923341362]], ["Anchor_Points_Weighted", "mmlu-pro_all", 10, 10, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3242467709135986, 0.5030140686350603, 0.36697477830247177, 0.5770621264043917, 0.5201286068264819]], ["Anchor_Points_Weighted", "mmlu-pro_all", 10, 10, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.5284863159765762, 0.6262015688255023, 0.5039103956885171, 0.6509413916278823, 0.6726858568622829]], ["Anchor_Points_Weighted", "mmlu-pro_all", 10, 10, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.44228212285979057, 0.5119085833560146, 0.33757546322941134, 0.5605061349643445, 0.6066294128805141]], ["Anchor_Points_Weighted", "mmlu-pro_all", 10, 10, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.6835969713869008, 0.6077933655105925, 0.37594617802200647, 0.6478477111258258, 0.6408858197962056]], ["Anchor_Points_Weighted", "mmlu-pro_all", 10, 10, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.5603563645851267, 0.4922764515572441, 0.34276163427278833, 0.5324080445725733, 0.558211968445507]], ["Anchor_Points_Weighted", "mmlu-pro_all", 10, 10, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4927479951455127, 0.5885520761889683, 0.3941403140960836, 0.6155321550924866, 0.7005258687265188]], ["Anchor_Points_Weighted", "mmlu-pro_all", 25, 25, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4570590426462842, 0.45620011367014035, 0.32257233588836987, 0.5000034110801915, 0.5459927034176423]], ["Anchor_Points_Weighted", "mmlu-pro_all", 25, 25, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41651304383307564, 0.4527074997621241, 0.32226803510456026, 0.5059608819912855, 0.5248765610786706]], ["Anchor_Points_Weighted", "mmlu-pro_all", 25, 25, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.38789630536563147, 0.47129565620173314, 0.31022201495708557, 0.5080634555452539, 0.5611552157465987]], ["Anchor_Points_Weighted", "mmlu-pro_all", 25, 25, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4483142427337492, 0.47599378079104626, 0.36381095545537917, 0.4995875002581843, 0.5961223356887753]], ["Anchor_Points_Weighted", "mmlu-pro_all", 25, 25, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4354143133743441, 0.45755046470572275, 0.31000390326525923, 0.504424534622357, 0.5730992919561132]], ["Anchor_Points_Weighted", "mmlu-pro_all", 25, 25, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40872331828455905, 0.39993309601770843, 0.3353065389545856, 0.4515522160665595, 0.46218266068108776]], ["Anchor_Points_Weighted", "mmlu-pro_all", 25, 25, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4564043623768524, 0.45523095918728557, 0.35552721254077624, 0.48704975433027675, 0.5315597036365055]], ["Anchor_Points_Weighted", "mmlu-pro_all", 25, 25, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41665376774328133, 0.429556923738762, 0.24792453544772883, 0.435736286122098, 0.5320373322324078]], ["Anchor_Points_Weighted", "mmlu-pro_all", 25, 25, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4452158823402341, 0.4317290340649603, 0.35792320889223966, 0.46426247716599567, 0.5419234251409644]], ["Anchor_Points_Weighted", "mmlu-pro_all", 25, 25, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4189248876451741, 0.493080882460652, 0.2941984053321602, 0.5110471522950083, 0.5755546710815045]], ["Anchor_Points_Weighted", "mmlu-pro_all", 50, 50, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4451907245738921, 0.4451713974715771, 0.3128727474629231, 0.4787400089786243, 0.5349411767169143]], ["Anchor_Points_Weighted", "mmlu-pro_all", 50, 50, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41989089207168445, 0.4381372590432779, 0.3358468037581529, 0.47855944194148137, 0.48917176111778066]], ["Anchor_Points_Weighted", "mmlu-pro_all", 50, 50, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4136981716694552, 0.4693884691897931, 0.28630578105361737, 0.4930956139296407, 0.532970369561113]], ["Anchor_Points_Weighted", "mmlu-pro_all", 50, 50, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4492522610580464, 0.4567654340865346, 0.333034995232667, 0.4717372451940033, 0.5400034527640369]], ["Anchor_Points_Weighted", "mmlu-pro_all", 50, 50, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3971599823940781, 0.4333484095219208, 0.31876635251709656, 0.47193828726085746, 0.5171600877335408]], ["Anchor_Points_Weighted", "mmlu-pro_all", 50, 50, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4089561310136107, 0.4311608615471587, 0.309959119654595, 0.4584976589682086, 0.5063231304556309]], ["Anchor_Points_Weighted", "mmlu-pro_all", 50, 50, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4464721277315645, 0.4486002984184598, 0.3146820191070477, 0.4847246887778175, 0.5208167479744901]], ["Anchor_Points_Weighted", "mmlu-pro_all", 50, 50, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41520144586328633, 0.43577654787329584, 0.28964128063782163, 0.4549190873366928, 0.5418048925866018]], ["Anchor_Points_Weighted", "mmlu-pro_all", 50, 50, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4125237889571937, 0.4260100873698595, 0.31849291816276576, 0.4648241862236457, 0.500795643434814]], ["Anchor_Points_Weighted", "mmlu-pro_all", 50, 50, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3851863964165112, 0.4303430791928698, 0.2639501581314791, 0.4551204771439193, 0.5219368151594299]], ["Anchor_Points_Weighted", "mmlu-pro_all", 100, 100, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4381893283686486, 0.42473942331405307, 0.3097095553048917, 0.46165243137893025, 0.5121838525840696]], ["Anchor_Points_Weighted", "mmlu-pro_all", 100, 100, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.42334104858785343, 0.4386285728594163, 0.32837266996035375, 0.4699271843658445, 0.5053143607607323]], ["Anchor_Points_Weighted", "mmlu-pro_all", 100, 100, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4131716280427437, 0.4548976259072843, 0.28578252806506566, 0.47156697035491196, 0.5235682331677748]], ["Anchor_Points_Weighted", "mmlu-pro_all", 100, 100, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.44905364198348147, 0.4326546049899376, 0.33572133806981647, 0.45848225697584793, 0.5272762289250545]], ["Anchor_Points_Weighted", "mmlu-pro_all", 100, 100, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39993042094785275, 0.4277568606204375, 0.3075971861237657, 0.46305511606888167, 0.5076017906898618]], ["Anchor_Points_Weighted", "mmlu-pro_all", 100, 100, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.38877280996955227, 0.4312978183257878, 0.28910751283693387, 0.4604461441315253, 0.5025864657033269]], ["Anchor_Points_Weighted", "mmlu-pro_all", 100, 100, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.44127971375290354, 0.44576910955571875, 0.3147749474220237, 0.47244608169383867, 0.5146428551134012]], ["Anchor_Points_Weighted", "mmlu-pro_all", 100, 100, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3757233601413878, 0.4135782138221043, 0.2722168614409212, 0.44468556981747653, 0.5119246528282626]], ["Anchor_Points_Weighted", "mmlu-pro_all", 100, 100, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4172442902975147, 0.41378020796479825, 0.3107572921365997, 0.4534098009135348, 0.48831902300675534]], ["Anchor_Points_Weighted", "mmlu-pro_all", 100, 100, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39442779651844573, 0.419956008176377, 0.2929171870818764, 0.44260445453995084, 0.5012168414978511]], ["Anchor_Points_Weighted", "mmlu-pro_all", 250, 250, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.43108474069785596, 0.4238053585581303, 0.30305478005597253, 0.45769045346431964, 0.5042826171747633]], ["Anchor_Points_Weighted", "mmlu-pro_all", 250, 250, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41512887555708944, 0.43488654367351753, 0.31200456881708327, 0.46070813490890605, 0.5065364347004889]], ["Anchor_Points_Weighted", "mmlu-pro_all", 250, 250, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40932231199561375, 0.43560096110208324, 0.2864273180526602, 0.4595574058845833, 0.4947762533341409]], ["Anchor_Points_Weighted", "mmlu-pro_all", 250, 250, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4242943187252475, 0.4247998474699436, 0.3062706215925958, 0.45445994764199105, 0.5023702085844136]], ["Anchor_Points_Weighted", "mmlu-pro_all", 250, 250, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39934947802669185, 0.41425180949937607, 0.2970979084831783, 0.45277330378781155, 0.49148444514697925]], ["Anchor_Points_Weighted", "mmlu-pro_all", 250, 250, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39762305231559314, 0.41455163025624414, 0.29502868563995543, 0.44565787096174303, 0.48608827225544887]], ["Anchor_Points_Weighted", "mmlu-pro_all", 250, 250, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4305443740625911, 0.4244095274630089, 0.3151146134014102, 0.4555803896049169, 0.5003748282194401]], ["Anchor_Points_Weighted", "mmlu-pro_all", 250, 250, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4007618112083127, 0.4054144174343538, 0.27767255199270924, 0.432891346717845, 0.4961980725576517]], ["Anchor_Points_Weighted", "mmlu-pro_all", 250, 250, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41417420943082184, 0.40478467485105607, 0.2992833338769779, 0.4430188506499817, 0.48727825691812954]], ["Anchor_Points_Weighted", "mmlu-pro_all", 250, 250, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4022611116135047, 0.4102056367182174, 0.2996562290663139, 0.4338811892508648, 0.48934462627568387]], ["Anchor_Points_Weighted", "mmlu-pro_all", 500, 500, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.42092960031805254, 0.414778983838591, 0.29302338247472365, 0.4445502993766757, 0.4847812740874381]], ["Anchor_Points_Weighted", "mmlu-pro_all", 500, 500, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4086561419150146, 0.4246043022834082, 0.30760070042266974, 0.448827194378437, 0.4913454507447724]], ["Anchor_Points_Weighted", "mmlu-pro_all", 500, 500, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39996359226168976, 0.4298797615176084, 0.2859855346366238, 0.44725049604796485, 0.48954603761155957]], ["Anchor_Points_Weighted", "mmlu-pro_all", 500, 500, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41192862009117953, 0.4149093086583021, 0.2988913376582546, 0.4414364826214161, 0.4939616035016119]], ["Anchor_Points_Weighted", "mmlu-pro_all", 500, 500, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3975868952165888, 0.4079086147573041, 0.2892888621664609, 0.4427566012559693, 0.4851518469217042]], ["Anchor_Points_Weighted", "mmlu-pro_all", 500, 500, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4000871380646588, 0.40732456873224676, 0.30662693249212275, 0.4326673114608359, 0.47670799101463723]], ["Anchor_Points_Weighted", "mmlu-pro_all", 500, 500, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4207987183179655, 0.4164766656411272, 0.3047619348314725, 0.44375059914052417, 0.48637215701382885]], ["Anchor_Points_Weighted", "mmlu-pro_all", 500, 500, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39368384741174534, 0.40068570391484726, 0.28605808713159353, 0.4284887320448526, 0.4856881296235921]], ["Anchor_Points_Weighted", "mmlu-pro_all", 500, 500, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40430897213086214, 0.4072143188364138, 0.29701435872063714, 0.43617617569887135, 0.4857445472655614]], ["Anchor_Points_Weighted", "mmlu-pro_all", 500, 500, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3961477995140138, 0.4020978647367105, 0.2932929176898109, 0.42340490558888333, 0.4777756884718995]], ["Anchor_Points_Weighted", "mmlu-pro_all", 1000, 1000, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41308657616034544, 0.4117430808530015, 0.29323055597132874, 0.4387543502869106, 0.47812650987609273]], ["Anchor_Points_Weighted", "mmlu-pro_all", 1000, 1000, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4058295699674392, 0.41883054417655224, 0.3028869799588097, 0.4404474387149734, 0.4817886618519049]], ["Anchor_Points_Weighted", "mmlu-pro_all", 1000, 1000, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39917953544259954, 0.4244684598452909, 0.2775845515818317, 0.44432981215147244, 0.4855880640217467]], ["Anchor_Points_Weighted", "mmlu-pro_all", 1000, 1000, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.407610035588134, 0.4075124143244262, 0.2998377286671022, 0.4365094887252506, 0.4817974793267131]], ["Anchor_Points_Weighted", "mmlu-pro_all", 1000, 1000, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39460765372054485, 0.4047896265089278, 0.2921276374113132, 0.4366433953150925, 0.4802427825464939]], ["Anchor_Points_Weighted", "mmlu-pro_all", 1000, 1000, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3974010737610845, 0.40266553627561996, 0.3004764684214454, 0.43101302560603505, 0.4712552558367863]], ["Anchor_Points_Weighted", "mmlu-pro_all", 1000, 1000, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41460975457016175, 0.414784770834539, 0.29617289329536967, 0.4427136061417932, 0.48816802664334713]], ["Anchor_Points_Weighted", "mmlu-pro_all", 1000, 1000, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3917020692391083, 0.3976510898472285, 0.29339830403012385, 0.4244084210277049, 0.47786328684356527]], ["Anchor_Points_Weighted", "mmlu-pro_all", 1000, 1000, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40636556602051266, 0.401712428285434, 0.2893484025473575, 0.43071599950642625, 0.47368345839878434]], ["Anchor_Points_Weighted", "mmlu-pro_all", 1000, 1000, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3928524396910105, 0.3993466009095614, 0.2946757562564068, 0.4214459175054618, 0.46934563127350437]], ["tinyBenchmarks", "mmlu-pro_all", 10, 10, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4567531603459748, 0.3305056553559548, 0.12624750499002, 0.42864271457085834, 0.3734198270126415]], ["tinyBenchmarks", "mmlu-pro_all", 25, 25, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39088489687292094, 0.39371257485029953, 0.35063206919494355, 0.37242182302062554, 0.42498336660013314]], ["tinyBenchmarks", "mmlu-pro_all", 50, 50, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.37840984697272134, 0.49667332002661363, 0.41151031270791755, 0.4657351962741186, 0.36077844311377255]], ["tinyBenchmarks", "mmlu-pro_all", 100, 100, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4248170326014639, 0.39953426480372595, 0.3536260811709914, 0.42930805056553567, 0.46590153027278775]], ["tinyBenchmarks", "mmlu-pro_all", 250, 250, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4176646706586827, 0.4524284763805722, 0.3850632069194943, 0.4735528942115768, 0.46606786427145697]], ["tinyBenchmarks", "mmlu-pro_all", 500, 500, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4196606786427142, 0.4422821024617427, 0.3507984031936128, 0.4499334664005321, 0.44377910844976676]], ["tinyBenchmarks", "mmlu-pro_all", 1000, 1000, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41932801064537795, 0.44644045242847885, 0.35844976713240323, 0.4510978043912201, 0.4386227544910203]], ["tinyBenchmarks", "mmlu-pro_all", 10, 10, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.7964071856287427, 0.33582834331337336, 0.2914171656686627, 0.5751829673985364, 0.573519627411843]], ["tinyBenchmarks", "mmlu-pro_all", 25, 25, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.46224218230206265, 0.4803725881570193, 0.3654357950765137, 0.5061543579507652, 0.4602461743180307]], ["tinyBenchmarks", "mmlu-pro_all", 50, 50, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4001996007984033, 0.5149700598802396, 0.2885894876912842, 0.47122421823020627, 0.4241516966067866]], ["tinyBenchmarks", "mmlu-pro_all", 100, 100, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4055222887558217, 0.4975049900199601, 0.4000332667997339, 0.47737857618097146, 0.511144377910845]], ["tinyBenchmarks", "mmlu-pro_all", 250, 250, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4161676646706587, 0.4818695941450433, 0.3516300731869595, 0.4943446440452431, 0.4647371922821024]], ["tinyBenchmarks", "mmlu-pro_all", 500, 500, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3957085828343312, 0.46340652029274754, 0.33749168330006635, 0.4710578842315364, 0.46706586826347235]], ["tinyBenchmarks", "mmlu-pro_all", 1000, 1000, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40901530272787945, 0.46756487025948335, 0.35096473719228327, 0.4702262142381925, 0.4562541583499687]], ["tinyBenchmarks", "mmlu-pro_all", 10, 10, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3950432468396541, 0.2816034597471724, 0.2816034597471724, 0.3557884231536927, 0.34481037924151703]], ["tinyBenchmarks", "mmlu-pro_all", 25, 25, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.44577511643379913, 0.5156353958749169, 0.3541250831669994, 0.48353293413173665, 0.48153692614770466]], ["tinyBenchmarks", "mmlu-pro_all", 50, 50, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3785761809713906, 0.4525948103792416, 0.2691284098469727, 0.46290751829673993, 0.44444444444444453]], ["tinyBenchmarks", "mmlu-pro_all", 100, 100, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40552228875582164, 0.4309713905522289, 0.3915502328675981, 0.4236526946107784, 0.41417165668662675]], ["tinyBenchmarks", "mmlu-pro_all", 250, 250, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39570858283433136, 0.46091151031270805, 0.3574517631403861, 0.46689953426480385, 0.452761144377911]], ["tinyBenchmarks", "mmlu-pro_all", 500, 500, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40186294078509655, 0.4632401862940784, 0.3519627411842979, 0.44910179640718545, 0.45059880239520955]], ["tinyBenchmarks", "mmlu-pro_all", 1000, 1000, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.399201596806389, 0.4672322022621448, 0.3631071190951443, 0.46523619427811286, 0.4479374584165025]], ["tinyBenchmarks", "mmlu-pro_all", 10, 10, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4234863606121092, 0.5179640718562876, 0.07218895542248838, 0.32401862940785103, 0.21556886227544914]], ["tinyBenchmarks", "mmlu-pro_all", 25, 25, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.36693280106453763, 0.5013306719893547, 0.3363273453093813, 0.47388556220891553, 0.39520958083832336]], ["tinyBenchmarks", "mmlu-pro_all", 50, 50, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4201596806387226, 0.3923819028609448, 0.36477045908183636, 0.4095143047238856, 0.4048569527611444]], ["tinyBenchmarks", "mmlu-pro_all", 100, 100, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.47504990019960075, 0.47421823020625403, 0.4016966067864271, 0.49451097804391203, 0.46490352628077164]], ["tinyBenchmarks", "mmlu-pro_all", 250, 250, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4535928143712575, 0.48935462408516295, 0.4011976047904191, 0.45359281437125754, 0.5063206919494345]], ["tinyBenchmarks", "mmlu-pro_all", 500, 500, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4471057884231538, 0.44461077844311375, 0.3809048569527612, 0.4562541583499668, 0.46573519627411847]], ["tinyBenchmarks", "mmlu-pro_all", 1000, 1000, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41383898868929, 0.46107784431137905, 0.37624750499002085, 0.46007984031936333, 0.46889554224883756]], ["tinyBenchmarks", "mmlu-pro_all", 10, 10, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.38339986693280115, 0.38339986693280115, 0.2471723220226215, 0.38339986693280115, 0.4770459081836329]], ["tinyBenchmarks", "mmlu-pro_all", 25, 25, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4777112441783101, 0.41051230871590166, 0.2880904856952762, 0.39687292082501674, 0.5896540252827678]], ["tinyBenchmarks", "mmlu-pro_all", 50, 50, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.5104790419161677, 0.4833666001330672, 0.41134397870924816, 0.518296739853626, 0.4758815701929474]], ["tinyBenchmarks", "mmlu-pro_all", 100, 100, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.46856287425149695, 0.5041583499667331, 0.3957085828343313, 0.5161343978709247, 0.4890219560878242]], ["tinyBenchmarks", "mmlu-pro_all", 250, 250, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4396207584830339, 0.46290751829674, 0.3180306054557552, 0.45858283433133745, 0.45991350632069206]], ["tinyBenchmarks", "mmlu-pro_all", 500, 500, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41101131071190933, 0.455089820359281, 0.3707584830339317, 0.45891550232867573, 0.46756487025948096]], ["tinyBenchmarks", "mmlu-pro_all", 1000, 1000, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.42714570858283557, 0.4630738522954111, 0.3666001330671999, 0.4649035262807738, 0.46440452428476586]], ["tinyBenchmarks", "mmlu-pro_all", 10, 10, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4851962741184299, 0.6556886227544911, 0.2982368596141052, 0.4673985362608118, 0.4003659347970726]], ["tinyBenchmarks", "mmlu-pro_all", 25, 25, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3160345974717233, 0.42198935462408527, 0.2997338656021291, 0.36044577511643383, 0.3050565535595476]], ["tinyBenchmarks", "mmlu-pro_all", 50, 50, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3571190951430473, 0.42498336660013314, 0.3285096473719229, 0.41200931470392554, 0.3880572188955423]], ["tinyBenchmarks", "mmlu-pro_all", 100, 100, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40352628077178965, 0.4479374584165002, 0.3258483033932136, 0.42664670658682624, 0.4522621423819029]], ["tinyBenchmarks", "mmlu-pro_all", 250, 250, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.37807717897538257, 0.4381237524950101, 0.35894876912841, 0.4354624085163008, 0.4377910844976716]], ["tinyBenchmarks", "mmlu-pro_all", 500, 500, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4091816367265468, 0.47072521623419816, 0.34381237524950115, 0.46290751829673976, 0.4703925482368595]], ["tinyBenchmarks", "mmlu-pro_all", 1000, 1000, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40302727877578337, 0.46540252827678175, 0.3532934131736537, 0.4649035262807737, 0.4569194943446459]], ["tinyBenchmarks", "mmlu-pro_all", 10, 10, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.6543579507651365, 0.37558216899534275, 0.5355954757152362, 0.5716899534264804, 0.5716899534264804]], ["tinyBenchmarks", "mmlu-pro_all", 25, 25, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.416333998669328, 0.46240851630073193, 0.37824351297405195, 0.4271457085828344, 0.4718895542248836]], ["tinyBenchmarks", "mmlu-pro_all", 50, 50, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.43646041250831685, 0.5706919494344644, 0.4888556220891552, 0.5192947438456421, 0.4792082501663341]], ["tinyBenchmarks", "mmlu-pro_all", 100, 100, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.42481703260146375, 0.47588157019294747, 0.39121756487025944, 0.44228210246174315, 0.5108117099135063]], ["tinyBenchmarks", "mmlu-pro_all", 250, 250, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4622421823020625, 0.4725548902195608, 0.38023952095808383, 0.49068529607451744, 0.4958416500332666]], ["tinyBenchmarks", "mmlu-pro_all", 500, 500, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4321357285429143, 0.4639055222887558, 0.4153359946773122, 0.46939454424484367, 0.4871922821024616]], ["tinyBenchmarks", "mmlu-pro_all", 1000, 1000, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40851630073187123, 0.4788755821689975, 0.3870592149035275, 0.4680638722554911, 0.48652694610778685]], ["tinyBenchmarks", "mmlu-pro_all", 10, 10, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.408183632734531, 0.42747837658017307, 0.3832335329341318, 0.31620093147039263, 0.33017298735861617]], ["tinyBenchmarks", "mmlu-pro_all", 25, 25, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.36061210911510316, 0.43596141051230886, 0.3847305389221558, 0.43596141051230886, 0.3810711909514305]], ["tinyBenchmarks", "mmlu-pro_all", 50, 50, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3685961410512309, 0.3789088489687293, 0.3732534930139721, 0.4374584165003327, 0.4520958083832336]], ["tinyBenchmarks", "mmlu-pro_all", 100, 100, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.395043246839654, 0.5094810379241517, 0.39337990685296076, 0.49550898203592814, 0.4783765801729873]], ["tinyBenchmarks", "mmlu-pro_all", 250, 250, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.42681304058549585, 0.4549234863606122, 0.380738522954092, 0.4750499001996009, 0.44893546240851645]], ["tinyBenchmarks", "mmlu-pro_all", 500, 500, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3960412508316694, 0.48320026613439715, 0.3952095808383229, 0.48785761809713835, 0.45808383233532857]], ["tinyBenchmarks", "mmlu-pro_all", 1000, 1000, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41067864271457205, 0.4692282102461761, 0.3651031270791762, 0.46423819028609636, 0.45891550232867784]], ["tinyBenchmarks", "mmlu-pro_all", 10, 10, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.33150365934797077, 0.33150365934797077, 0.5582168995342649, 0.4925149700598804, 0.4266467065868264]], ["tinyBenchmarks", "mmlu-pro_all", 25, 25, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39387890884896876, 0.365103127079175, 0.439620758483034, 0.490851630073187, 0.427478376580173]], ["tinyBenchmarks", "mmlu-pro_all", 50, 50, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.46889554224883584, 0.441616766467066, 0.454258150365935, 0.5869926813040588, 0.4760479041916169]], ["tinyBenchmarks", "mmlu-pro_all", 100, 100, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.37691284098469724, 0.47039254823685955, 0.30405854956753153, 0.48735861610113096, 0.4637391882900864]], ["tinyBenchmarks", "mmlu-pro_all", 250, 250, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.42149035262807716, 0.4135063206919494, 0.3900532268795741, 0.43729208250166335, 0.48153692614770444]], ["tinyBenchmarks", "mmlu-pro_all", 500, 500, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41051230871590133, 0.4384564204923483, 0.3567864271457085, 0.46540252827677936, 0.4500998003992013]], ["tinyBenchmarks", "mmlu-pro_all", 1000, 1000, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4060212907518311, 0.4456087824351315, 0.34597471723220335, 0.46224218230206465, 0.46839654025282984]], ["tinyBenchmarks", "mmlu-pro_all", 10, 10, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.33549567531603464, 0.33549567531603464, 0.1909514304723886, 0.407684630738523, 0.33549567531603464]], ["tinyBenchmarks", "mmlu-pro_all", 25, 25, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3918829008649368, 0.3958749168330007, 0.32601463739188297, 0.4958416500332669, 0.43429807052561553]], ["tinyBenchmarks", "mmlu-pro_all", 50, 50, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.47405189620758503, 0.5111443779108452, 0.35379241516966076, 0.5179640718562877, 0.5492348636061212]], ["tinyBenchmarks", "mmlu-pro_all", 100, 100, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4264803725881571, 0.4851962741184299, 0.3637724550898205, 0.47920825016633406, 0.43679308050565535]], ["tinyBenchmarks", "mmlu-pro_all", 250, 250, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.42847638057218906, 0.4667332002661345, 0.3747504990019961, 0.4525948103792416, 0.43895542248835684]], ["tinyBenchmarks", "mmlu-pro_all", 500, 500, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.43113772455089794, 0.4530938123752493, 0.4189953426480369, 0.4738855622089153, 0.456919494344644]], ["tinyBenchmarks", "mmlu-pro_all", 1000, 1000, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4323020625415851, 0.4565868263473069, 0.3875582168995358, 0.4575848303393231, 0.46207584830339493]], ["Stratified_Random_Sampling", "mmlu-pro_all", 10, 10, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.11427145708582834, 0.11427145708582834, 0.427478376580173, 0.11427145708582834, 0.11427145708582834]], ["Stratified_Random_Sampling", "mmlu-pro_all", 10, 10, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.447272122421823, 0.2721224218230206, 0.1712408516300732, 0.3722554890219561, 0.3722554890219561]], ["Stratified_Random_Sampling", "mmlu-pro_all", 10, 10, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3310878243512974, 0.28875582168995345, 0.31694943446440454, 0.3310878243512974, 0.2523286759813706]], ["Stratified_Random_Sampling", "mmlu-pro_all", 10, 10, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40668662674650696, 0.24916833000665337, 0.2090818363273453, 0.24916833000665337, 0.3278443113772455]], ["Stratified_Random_Sampling", "mmlu-pro_all", 10, 10, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.31320691949434465, 0.4644045242847638, 0.3972055888223553, 0.36909514304723884, 0.4644045242847638]], ["Stratified_Random_Sampling", "mmlu-pro_all", 10, 10, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.1259148369926813, 0.21224218230206254, 0.4706420492348636, 0.3396540252827678, 0.3396540252827678]], ["Stratified_Random_Sampling", "mmlu-pro_all", 10, 10, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.425981370592149, 0.41974384564204925, 0.21340652029274784, 0.41974384564204925, 0.49983366600133067]], ["Stratified_Random_Sampling", "mmlu-pro_all", 10, 10, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.2381902860944777, 0.20326014637391882, 0.3596972721224218, 0.20326014637391882, 0.3369926813040586]], ["Stratified_Random_Sampling", "mmlu-pro_all", 10, 10, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.25482368596141053, 0.43271789753825685, 0.3207751164337991, 0.35196274118429804, 0.43271789753825685]], ["Stratified_Random_Sampling", "mmlu-pro_all", 10, 10, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.23652694610778444, 0.561127744510978, 0.18762475049900199, 0.561127744510978, 0.561127744510978]], ["Stratified_Random_Sampling", "mmlu-pro_all", 25, 25, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.5501497005988024, 0.40198769128409845, 0.4172488356620093, 0.5251580172987359, 0.5671157684630739]], ["Stratified_Random_Sampling", "mmlu-pro_all", 25, 25, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41304612996229767, 0.4411177644710579, 0.34043025060989135, 0.5232867598137059, 0.5236027944111776]], ["Stratified_Random_Sampling", "mmlu-pro_all", 25, 25, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.5992320913728099, 0.5614188290086493, 0.2824767132401863, 0.6005073186959414, 0.5195026613439786]], ["Stratified_Random_Sampling", "mmlu-pro_all", 25, 25, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4379574184963407, 0.5200266134397871, 0.34565868263473054, 0.43779108449767135, 0.5978043912175649]], ["Stratified_Random_Sampling", "mmlu-pro_all", 25, 25, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.30649811488134837, 0.38073297848746945, 0.29466067864271456, 0.41638944333555106, 0.3758094921268573]], ["Stratified_Random_Sampling", "mmlu-pro_all", 25, 25, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.5022177866489244, 0.5479457751164338, 0.46207862053670434, 0.6321523619427811, 0.505475160789532]], ["Stratified_Random_Sampling", "mmlu-pro_all", 25, 25, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.37159015302727877, 0.49303060545575517, 0.31260811709913505, 0.49303060545575517, 0.4950681969394545]], ["Stratified_Random_Sampling", "mmlu-pro_all", 25, 25, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4454424484364604, 0.43908017298735863, 0.40157185628742514, 0.35254491017964074, 0.4151696606786427]], ["Stratified_Random_Sampling", "mmlu-pro_all", 25, 25, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.30451596806387227, 0.5844311377245509, 0.4100715236194278, 0.5034680638722555, 0.4213656021290752]], ["Stratified_Random_Sampling", "mmlu-pro_all", 25, 25, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.5805195165225104, 0.5383122643601685, 0.4663173652694611, 0.5756958305611, 0.5383122643601685]], ["Stratified_Random_Sampling", "mmlu-pro_all", 50, 50, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.519692757342458, 0.5814026708487786, 0.5213620378291037, 0.6025746126794032, 0.6020188459060715]], ["Stratified_Random_Sampling", "mmlu-pro_all", 50, 50, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4054723885562209, 0.4248096399793007, 0.34320802838766923, 0.5034893176609744, 0.3666916167664671]], ["Stratified_Random_Sampling", "mmlu-pro_all", 50, 50, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4823478043912177, 0.5801799179418942, 0.32129491017964074, 0.5398231315147484, 0.49916833000665345]], ["Stratified_Random_Sampling", "mmlu-pro_all", 50, 50, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4804862497227767, 0.4403380108469929, 0.3806082279884675, 0.43949802415371286, 0.4748253493013973]], ["Stratified_Random_Sampling", "mmlu-pro_all", 50, 50, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.37929696163229093, 0.48303947660235075, 0.45594366821911725, 0.44297793302284316, 0.4635783987580394]], ["Stratified_Random_Sampling", "mmlu-pro_all", 50, 50, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3557560804317291, 0.39896364678051305, 0.3387761514009019, 0.45845715975456497, 0.4171009832187477]], ["Stratified_Random_Sampling", "mmlu-pro_all", 50, 50, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4739479374584165, 0.5167858726990464, 0.39847619575663484, 0.5177838766910624, 0.49474661787536045]], ["Stratified_Random_Sampling", "mmlu-pro_all", 50, 50, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.38497053512023577, 0.44976594430187256, 0.3479378544498305, 0.4857616777027955, 0.4855330344601802]], ["Stratified_Random_Sampling", "mmlu-pro_all", 50, 50, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3103371959784135, 0.39067651733569897, 0.36523527020034, 0.44875942559325793, 0.46978034671397945]], ["Stratified_Random_Sampling", "mmlu-pro_all", 50, 50, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3084378861324969, 0.5723461146490089, 0.43556399106548804, 0.5341912735375809, 0.5059379257358299]], ["Stratified_Random_Sampling", "mmlu-pro_all", 100, 100, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4487351152396061, 0.5289256673932174, 0.36730923836088486, 0.4976236880186332, 0.4679567147755769]], ["Stratified_Random_Sampling", "mmlu-pro_all", 100, 100, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3775282767797739, 0.428798611926474, 0.3684206905206085, 0.4180361499223776, 0.48918432198783285]], ["Stratified_Random_Sampling", "mmlu-pro_all", 100, 100, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.45976647894686795, 0.5009009758261252, 0.37980586446155307, 0.4995906005449417, 0.5092686650508504]], ["Stratified_Random_Sampling", "mmlu-pro_all", 100, 100, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.42750682844836646, 0.4770743600518262, 0.42931268832427044, 0.46763490562734183, 0.4474614367755717]], ["Stratified_Random_Sampling", "mmlu-pro_all", 100, 100, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4464433016323044, 0.49586988261651316, 0.3379156624925149, 0.456247769376929, 0.4462757678470215]], ["Stratified_Random_Sampling", "mmlu-pro_all", 100, 100, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39683012129993167, 0.5051435742678255, 0.37952387349842437, 0.5339307293024855, 0.3883171106911127]], ["Stratified_Random_Sampling", "mmlu-pro_all", 100, 100, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39318646995792705, 0.4135736082779497, 0.41140862607304735, 0.4027845027283651, 0.4636237039555405]], ["Stratified_Random_Sampling", "mmlu-pro_all", 100, 100, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4426796147942091, 0.5135657794516547, 0.3531715937991623, 0.5233129517736773, 0.5036821279512368]], ["Stratified_Random_Sampling", "mmlu-pro_all", 100, 100, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.47955826893970355, 0.5392164744584905, 0.3471570747394102, 0.5392596994120922, 0.5588545861493389]], ["Stratified_Random_Sampling", "mmlu-pro_all", 100, 100, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.35707289125452807, 0.4656382224657439, 0.2860113107119095, 0.44480021438604267, 0.5056722067846876]], ["Stratified_Random_Sampling", "mmlu-pro_all", 250, 250, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4000299894386724, 0.46352869326732693, 0.37996536775650097, 0.4797856510078873, 0.44019910710091437]], ["Stratified_Random_Sampling", "mmlu-pro_all", 250, 250, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3980763535310403, 0.4419408600096712, 0.31854644018223177, 0.4659372190545795, 0.477976512833932]], ["Stratified_Random_Sampling", "mmlu-pro_all", 250, 250, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4355173233415867, 0.45136633075333343, 0.39553988683699215, 0.4712449234719602, 0.4836211854967801]], ["Stratified_Random_Sampling", "mmlu-pro_all", 250, 250, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4028023013801457, 0.4709406698616961, 0.33863737172120406, 0.4506681974778803, 0.4709284422607779]], ["Stratified_Random_Sampling", "mmlu-pro_all", 250, 250, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40967351459357626, 0.48548308825670805, 0.35352233679280565, 0.5055270312725992, 0.465325190003285]], ["Stratified_Random_Sampling", "mmlu-pro_all", 250, 250, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.38545497195197775, 0.4729773226791686, 0.3537056759312245, 0.4529334005519131, 0.47712532976005995]], ["Stratified_Random_Sampling", "mmlu-pro_all", 250, 250, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4269842454840661, 0.4825204678941499, 0.3706856056714762, 0.4825111498524184, 0.5067005217336344]], ["Stratified_Random_Sampling", "mmlu-pro_all", 250, 250, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3902989649838974, 0.4754664518537931, 0.35828858875440117, 0.48726902501620467, 0.46745965180027266]], ["Stratified_Random_Sampling", "mmlu-pro_all", 250, 250, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.37620001699343025, 0.4525300409282444, 0.3607236104990597, 0.4723384760061406, 0.47320915528250845]], ["Stratified_Random_Sampling", "mmlu-pro_all", 250, 250, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.38961986965029766, 0.45739692942569754, 0.38626172046912066, 0.4535097043802455, 0.44581973795882895]], ["Stratified_Random_Sampling", "mmlu-pro_all", 500, 500, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3945067342124444, 0.4645857162337807, 0.3543490756831669, 0.48061278844809796, 0.44858043325837976]], ["Stratified_Random_Sampling", "mmlu-pro_all", 500, 500, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.42495583794075587, 0.4768061464640554, 0.37913529033576926, 0.472807346326835, 0.48289996028095844]], ["Stratified_Random_Sampling", "mmlu-pro_all", 500, 500, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4013098626203675, 0.46121340537958366, 0.3672840419566479, 0.4712721081317975, 0.46135503162237024]], ["Stratified_Random_Sampling", "mmlu-pro_all", 500, 500, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.411860769007989, 0.4759208606458525, 0.35380850324110097, 0.4779469089295114, 0.46790658992384176]], ["Stratified_Random_Sampling", "mmlu-pro_all", 500, 500, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3984987071925172, 0.48643571270536234, 0.3523599876958694, 0.4924903051748444, 0.4944297943293767]], ["Stratified_Random_Sampling", "mmlu-pro_all", 500, 500, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.42019764144683613, 0.44828190233620785, 0.36629521852009655, 0.4582247716413266, 0.4261466316932908]], ["Stratified_Random_Sampling", "mmlu-pro_all", 500, 500, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4086177776204211, 0.4706675400590352, 0.3585978780522342, 0.4667235133470735, 0.4606402316222955]], ["Stratified_Random_Sampling", "mmlu-pro_all", 500, 500, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4007598734841599, 0.43866067714210405, 0.3509303349211294, 0.4446712614233462, 0.46859192879869394]], ["Stratified_Random_Sampling", "mmlu-pro_all", 500, 500, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3952062184857501, 0.461188692010283, 0.36717811815731033, 0.46926353472091364, 0.4732303559129073]], ["Stratified_Random_Sampling", "mmlu-pro_all", 500, 500, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3894875510798019, 0.4636287410006508, 0.3852189135794513, 0.4536693009403226, 0.4435197067662075]], ["Stratified_Random_Sampling", "mmlu-pro_all", 1000, 1000, 300, 0, [0.40901530272787756, 0.46540252827677975, 0.36543579507651364, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4564784053156146, 0.3712624584717608, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3969930970863956, 0.4690357519549799, 0.3780009623807806, 0.4740171734452571, 0.44504986281509656]], ["Stratified_Random_Sampling", "mmlu-pro_all", 1000, 1000, 300, 1, [0.4091816367265469, 0.47005988023952094, 0.3604457751164338, 0.4732202262142382, 0.4644045242847638], [0.4061461794019934, 0.45182724252491696, 0.37624584717607973, 0.4599667774086379, 0.4606312292358804], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.41300125541128657, 0.45701024259162665, 0.3719847045931456, 0.4600183287901612, 0.4730167616192855]], ["Stratified_Random_Sampling", "mmlu-pro_all", 1000, 1000, 300, 2, [0.4098469727212242, 0.46540252827677975, 0.36177644710578843, 0.47005988023952094, 0.4615768463073852], [0.4054817275747508, 0.4564784053156146, 0.37491694352159466, 0.46312292358803986, 0.4634551495016611], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.3981059920249787, 0.4640945351358959, 0.35219486732219846, 0.4571119034747972, 0.4501290442581985]], ["Stratified_Random_Sampling", "mmlu-pro_all", 1000, 1000, 300, 3, [0.4121756487025948, 0.46457085828343314, 0.36793080505655357, 0.46823020625415834, 0.46706586826347307], [0.403156146179402, 0.45730897009966776, 0.3687707641196013, 0.4649501661129568, 0.4579734219269103], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39335620428160434, 0.450207291078224, 0.3735019768913174, 0.45624420334248655, 0.4851770827844175]], ["Stratified_Random_Sampling", "mmlu-pro_all", 1000, 1000, 300, 4, [0.4106786427145709, 0.46773120425815035, 0.36726546906187624, 0.46706586826347307, 0.46956087824351295], [0.4046511627906977, 0.4541528239202658, 0.36943521594684386, 0.46611295681063125, 0.4554817275747508], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4150834510546192, 0.48804065876390185, 0.35510472818883737, 0.4820492197975673, 0.48207177720172556]], ["Stratified_Random_Sampling", "mmlu-pro_all", 1000, 1000, 300, 5, [0.40635395874916835, 0.4605788423153693, 0.36726546906187624, 0.47005988023952094, 0.46274118429807054], [0.4089700996677741, 0.4612956810631229, 0.36943521594684386, 0.46312292358803986, 0.4622923588039867], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40836536698379655, 0.4604210474993191, 0.3853495465235326, 0.47545159305370127, 0.44844490525882863]], ["Stratified_Random_Sampling", "mmlu-pro_all", 1000, 1000, 300, 6, [0.40901530272787756, 0.46174318030605455, 0.37491683300066536, 0.4697272122421823, 0.46457085828343314], [0.406312292358804, 0.4601328903654485, 0.3617940199335548, 0.4634551495016611, 0.4604651162790698], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4065331671996377, 0.4665891945948753, 0.37250488149528427, 0.4826137614548634, 0.46156280654730164]], ["Stratified_Random_Sampling", "mmlu-pro_all", 1000, 1000, 300, 7, [0.40652029274783763, 0.4624085163007319, 0.37109115103127077, 0.46706586826347307, 0.4667332002661344], [0.40880398671096346, 0.45946843853820596, 0.36561461794019934, 0.46611295681063125, 0.45830564784053157], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.40142388456183886, 0.45439596636234636, 0.3694030912637366, 0.4454615786795732, 0.46140664620044597]], ["Stratified_Random_Sampling", "mmlu-pro_all", 1000, 1000, 300, 8, [0.3992015968063872, 0.4560878243512974, 0.36593479707252163, 0.46091151031270794, 0.4619095143047239], [0.4161129568106312, 0.46578073089700994, 0.3707641196013289, 0.4722591362126246, 0.46312292358803986], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.39283318029247694, 0.4408209670582779, 0.37188857896676897, 0.44579610971673633, 0.4558050322290172]], ["Stratified_Random_Sampling", "mmlu-pro_all", 1000, 1000, 300, 9, [0.40901530272787756, 0.46107784431137727, 0.37258815701929476, 0.4642381902860945, 0.46091151031270794], [0.406312292358804, 0.46079734219269103, 0.36411960132890364, 0.46893687707641196, 0.4641196013289037], [0.4076628989361702, 0.4609375, 0.3683510638297872, 0.4665890957446808, 0.4625166223404255], [0.4145255102994315, 0.4634108138184505, 0.35767507115817515, 0.47341120230766864, 0.48439516597321647]]]