,Technique,Number of source models,Fraction of sampled points,Average correctness seen (mean),Average correctness unseen (mean)
0,Random (uniform),10,10,0.6300734693877551,0.6289632653061225
1,"Random (subtask stratified, equal)",10,10,0.6265142857142857,0.6252734693877551
2,Diversity,10,10,0.6463673469387755,0.6461224489795918
3,Stratified sampling (confidence),10,10,0.6987959183673469,0.6976530612244898
4,Anchor Points,10,10,0.8213714285714285,0.8196408163265306
5,tinyBenchmarks,10,10,0.726334693877551,0.7263836734693877
6,Random (uniform),10,25,0.7643265306122449,0.7609142857142858
7,"Random (subtask stratified, equal)",10,25,0.7627755102040816,0.7592816326530613
8,Diversity,10,25,0.7591020408163265,0.7576326530612245
9,Stratified sampling (confidence),10,25,0.7887142857142857,0.787530612244898
10,Anchor Points,10,25,0.8654367346938775,0.8649142857142857
11,tinyBenchmarks,10,25,0.8026938775510204,0.8011428571428572
12,Random (uniform),10,50,0.8269387755102041,0.8217142857142857
13,"Random (subtask stratified, equal)",10,50,0.8239020408163266,0.8214530612244898
14,Diversity,10,50,0.8152244897959183,0.8128979591836735
15,Stratified sampling (confidence),10,50,0.8553877551020408,0.8516530612244898
16,Anchor Points,10,50,0.8941551020408163,0.8909551020408163
17,tinyBenchmarks,10,50,0.840930612244898,0.8374857142857143
18,Random (uniform),10,100,0.8741224489795918,0.8690775510204082
19,"Random (subtask stratified, equal)",10,100,0.8780408163265306,0.8744163265306123
20,Diversity,10,100,0.8637755102040816,0.8601020408163266
21,Stratified sampling (confidence),10,100,0.8893265306122449,0.8837755102040816
22,Anchor Points,10,100,0.9100081632653061,0.9078204081632653
23,tinyBenchmarks,10,100,0.8845387755102041,0.8809795918367347
24,Random (uniform),10,250,0.9219918367346939,0.9131428571428571
25,"Random (subtask stratified, equal)",10,250,0.920995918367347,0.9135510204081633
26,Diversity,10,250,0.908734693877551,0.9029183673469388
27,Stratified sampling (confidence),10,250,0.9285102040816327,0.9191020408163265
28,Anchor Points,10,250,0.922873469387755,0.9187591836734694
29,tinyBenchmarks,10,250,0.9199836734693878,0.9127836734693877
30,Random (uniform),10,500,0.9450775510204081,0.9365551020408164
31,"Random (subtask stratified, equal)",10,500,0.9454040816326531,0.9367020408163266
32,Diversity,10,500,0.9238163265306123,0.916795918367347
33,Stratified sampling (confidence),10,500,0.9463469387755102,0.937469387755102
34,Anchor Points,10,500,0.9300408163265306,0.9252408163265307
35,tinyBenchmarks,10,500,0.9413551020408163,0.9318693877551021
36,Random (uniform),10,1000,0.9646204081632653,0.9509224489795919
37,"Random (subtask stratified, equal)",10,1000,0.9659755102040817,0.9523102040816327
38,Diversity,10,1000,0.9426938775510204,0.933469387755102
39,Stratified sampling (confidence),10,1000,0.9685918367346938,0.9538367346938775
40,Anchor Points,10,1000,0.935330612244898,0.9298122448979592
41,tinyBenchmarks,10,1000,0.9592979591836734,0.947134693877551
42,Random (uniform),50,10,0.6355918367346939,0.634269387755102
43,"Random (subtask stratified, equal)",50,10,0.652604081632653,0.6525387755102041
44,Diversity,50,10,0.6243061224489795,0.6238367346938776
45,Stratified sampling (confidence),50,10,0.712204081632653,0.7104081632653061
46,Anchor Points,50,10,0.8578775510204082,0.8548081632653062
47,tinyBenchmarks,50,10,0.7134530612244898,0.7139428571428571
48,Random (uniform),50,25,0.7442775510204082,0.7422040816326531
49,"Random (subtask stratified, equal)",50,25,0.7589551020408163,0.7560979591836735
50,Diversity,50,25,0.7496734693877551,0.7468367346938776
51,Stratified sampling (confidence),50,25,0.8010204081632653,0.7994081632653062
52,Anchor Points,50,25,0.8827102040816327,0.8802285714285715
53,tinyBenchmarks,50,25,0.8113959183673469,0.8073632653061225
54,Random (uniform),50,50,0.8265142857142858,0.8240489795918368
55,"Random (subtask stratified, equal)",50,50,0.8291918367346939,0.8269714285714286
56,Diversity,50,50,0.8191632653061225,0.8149387755102041
57,Stratified sampling (confidence),50,50,0.8536734693877551,0.8490612244897959
58,Anchor Points,50,50,0.9028244897959183,0.8969142857142857
59,tinyBenchmarks,50,50,0.8639673469387755,0.8585469387755102
60,Random (uniform),50,100,0.8760326530612245,0.8711020408163266
61,"Random (subtask stratified, equal)",50,100,0.8801142857142857,0.8741387755102041
62,Diversity,50,100,0.8685306122448979,0.8631020408163266
63,Stratified sampling (confidence),50,100,0.890734693877551,0.8851020408163265
64,Anchor Points,50,100,0.9167673469387755,0.9136326530612245
65,tinyBenchmarks,50,100,0.901469387755102,0.8965877551020408
66,Random (uniform),50,250,0.9208489795918368,0.9139265306122449
67,"Random (subtask stratified, equal)",50,250,0.9251265306122449,0.9162448979591836
68,Diversity,50,250,0.9112040816326531,0.9034897959183673
69,Stratified sampling (confidence),50,250,0.9248979591836735,0.9188979591836735
70,Anchor Points,50,250,0.9270204081632653,0.9224489795918367
71,tinyBenchmarks,50,250,0.9370775510204081,0.9278204081632653
72,Random (uniform),50,500,0.9503510204081632,0.9381387755102041
73,"Random (subtask stratified, equal)",50,500,0.948,0.9373877551020409
74,Diversity,50,500,0.9292857142857143,0.9198163265306123
75,Stratified sampling (confidence),50,500,0.9512448979591837,0.9400612244897959
76,Anchor Points,50,500,0.9336163265306122,0.9276081632653062
77,tinyBenchmarks,50,500,0.9530938775510204,0.9412244897959183
78,Random (uniform),50,1000,0.9646367346938776,0.9501714285714286
79,"Random (subtask stratified, equal)",50,1000,0.9653877551020408,0.9491591836734694
80,Diversity,50,1000,0.9507551020408164,0.9378979591836735
81,Stratified sampling (confidence),50,1000,0.9673673469387755,0.9510816326530612
82,Anchor Points,50,1000,0.936195918367347,0.9292734693877551
83,tinyBenchmarks,50,1000,0.9675755102040816,0.9508897959183673
84,Random (uniform),100,10,0.6389551020408163,0.6366204081632653
85,"Random (subtask stratified, equal)",100,10,0.6397387755102041,0.6373387755102041
86,Diversity,100,10,0.6406938775510204,0.6401428571428571
87,Stratified sampling (confidence),100,10,0.7287959183673469,0.728734693877551
88,Anchor Points,100,10,0.8612571428571428,0.8579918367346939
89,tinyBenchmarks,100,10,0.7271673469387755,0.7236081632653061
90,Random (uniform),100,25,0.7523591836734694,0.7485387755102041
91,"Random (subtask stratified, equal)",100,25,0.7677224489795919,0.7657632653061225
92,Diversity,100,25,0.7375714285714285,0.7367959183673469
93,Stratified sampling (confidence),100,25,0.795469387755102,0.792530612244898
94,Anchor Points,100,25,0.886138775510204,0.8851265306122449
95,tinyBenchmarks,100,25,0.8153959183673469,0.8136163265306122
96,Random (uniform),100,50,0.8267755102040817,0.8240489795918368
97,"Random (subtask stratified, equal)",100,50,0.8237224489795918,0.819330612244898
98,Diversity,100,50,0.8134489795918367,0.8109795918367347
99,Stratified sampling (confidence),100,50,0.8511632653061224,0.8493673469387755
100,Anchor Points,100,50,0.909534693877551,0.9058122448979592
101,tinyBenchmarks,100,50,0.8669714285714286,0.8645061224489796
102,Random (uniform),100,100,0.8820408163265306,0.8785795918367347
103,"Random (subtask stratified, equal)",100,100,0.8788081632653061,0.8742367346938775
104,Diversity,100,100,0.8647551020408163,0.8599183673469388
105,Stratified sampling (confidence),100,100,0.8904285714285715,0.8862244897959184
106,Anchor Points,100,100,0.9237224489795919,0.9196408163265306
107,tinyBenchmarks,100,100,0.9067591836734694,0.9000326530612245
108,Random (uniform),100,250,0.9251755102040816,0.9174857142857142
109,"Random (subtask stratified, equal)",100,250,0.9224979591836735,0.9147918367346939
110,Diversity,100,250,0.9082857142857143,0.9032653061224489
111,Stratified sampling (confidence),100,250,0.9293469387755102,0.9204489795918367
112,Anchor Points,100,250,0.9335346938775511,0.9289632653061225
113,tinyBenchmarks,100,250,0.936734693877551,0.928130612244898
114,Random (uniform),100,500,0.9481306122448979,0.9366857142857142
115,"Random (subtask stratified, equal)",100,500,0.9470693877551021,0.9347428571428571
116,Diversity,100,500,0.9262244897959183,0.9196122448979592
117,Stratified sampling (confidence),100,500,0.947530612244898,0.9372448979591836
118,Anchor Points,100,500,0.9372081632653061,0.9326367346938775
119,tinyBenchmarks,100,500,0.9545469387755102,0.9443265306122449
120,Random (uniform),100,1000,0.965469387755102,0.9518857142857143
121,"Random (subtask stratified, equal)",100,1000,0.9654530612244898,0.9509387755102041
122,Diversity,100,1000,0.9464285714285714,0.9358163265306122
123,Stratified sampling (confidence),100,1000,0.9674489795918367,0.9526734693877551
124,Anchor Points,100,1000,0.9382530612244898,0.9332897959183674
125,tinyBenchmarks,100,1000,0.9688816326530613,0.9546775510204082
126,Random (uniform),150,10,0.6354938775510204,0.6345142857142857
127,"Random (subtask stratified, equal)",150,10,0.6391510204081633,0.637404081632653
128,Diversity,150,10,0.6494897959183673,0.647734693877551
129,Stratified sampling (confidence),150,10,0.7074489795918367,0.706469387755102
130,Anchor Points,150,10,0.8601142857142857,0.8570122448979591
131,tinyBenchmarks,150,10,0.7216163265306123,0.7187755102040816
132,Random (uniform),150,25,0.7570122448979592,0.7557714285714285
133,"Random (subtask stratified, equal)",150,25,0.7596571428571428,0.7566857142857143
134,Diversity,150,25,0.7390816326530613,0.7368571428571429
135,Stratified sampling (confidence),150,25,0.8103265306122449,0.8087142857142857
136,Anchor Points,150,25,0.8911346938775511,0.8873142857142857
137,tinyBenchmarks,150,25,0.8046204081632653,0.8011265306122449
138,Random (uniform),150,50,0.8190857142857143,0.8161306122448979
139,"Random (subtask stratified, equal)",150,50,0.8266775510204082,0.8247020408163265
140,Diversity,150,50,0.8199387755102041,0.8150408163265306
141,Stratified sampling (confidence),150,50,0.8481632653061224,0.8475102040816327
142,Anchor Points,150,50,0.9098285714285714,0.9042775510204082
143,tinyBenchmarks,150,50,0.8599510204081633,0.8561142857142857
144,Random (uniform),150,100,0.8754938775510204,0.8717551020408163
145,"Random (subtask stratified, equal)",150,100,0.873730612244898,0.8685224489795919
146,Diversity,150,100,0.8663061224489796,0.8611428571428571
147,Stratified sampling (confidence),150,100,0.8863673469387755,0.8827551020408163
148,Anchor Points,150,100,0.9237714285714286,0.9176
149,tinyBenchmarks,150,100,0.9043591836734693,0.9003428571428571
150,Random (uniform),150,250,0.9222040816326531,0.9161959183673469
151,"Random (subtask stratified, equal)",150,250,0.9224163265306122,0.9161469387755102
152,Diversity,150,250,0.9122653061224489,0.9036122448979592
153,Stratified sampling (confidence),150,250,0.9288571428571428,0.9210612244897959
154,Anchor Points,150,250,0.9339265306122448,0.9272
155,tinyBenchmarks,150,250,0.9358204081632653,0.9273632653061225
156,Random (uniform),150,500,0.9480326530612245,0.9378122448979592
157,"Random (subtask stratified, equal)",150,500,0.9486530612244898,0.9372408163265306
158,Diversity,150,500,0.9314489795918367,0.9219795918367347
159,Stratified sampling (confidence),150,500,0.9493877551020408,0.940530612244898
160,Anchor Points,150,500,0.9369469387755102,0.9299918367346939
161,tinyBenchmarks,150,500,0.9542367346938776,0.9423183673469387
162,Random (uniform),150,1000,0.9669061224489796,0.9543020408163265
163,"Random (subtask stratified, equal)",150,1000,0.9654367346938776,0.951330612244898
164,Diversity,150,1000,0.9500204081632653,0.9375510204081633
165,Stratified sampling (confidence),150,1000,0.9658571428571429,0.9521836734693877
166,Anchor Points,150,1000,0.9374367346938776,0.931004081632653
167,tinyBenchmarks,150,1000,0.9688,0.9525224489795918
168,Random (uniform),200,10,0.637665306122449,0.6350204081632653
169,"Random (subtask stratified, equal)",200,10,0.6363755102040817,0.6353142857142857
170,Diversity,200,10,0.6057551020408163,0.6026734693877551
171,Stratified sampling (confidence),200,10,0.7132857142857143,0.712204081632653
172,Anchor Points,200,10,0.8609142857142857,0.8610122448979591
173,tinyBenchmarks,200,10,0.7170122448979592,0.7173877551020408
174,Random (uniform),200,25,0.7557224489795918,0.7535836734693877
175,"Random (subtask stratified, equal)",200,25,0.7516408163265306,0.7481469387755102
176,Diversity,200,25,0.7382244897959184,0.7363061224489796
177,Stratified sampling (confidence),200,25,0.8006734693877551,0.7983877551020409
178,Anchor Points,200,25,0.8914612244897959,0.8885551020408163
179,tinyBenchmarks,200,25,0.8091102040816327,0.8075428571428571
180,Random (uniform),200,50,0.8261551020408163,0.822204081632653
181,"Random (subtask stratified, equal)",200,50,0.8319673469387755,0.828865306122449
182,Diversity,200,50,0.8130408163265306,0.8097142857142857
183,Stratified sampling (confidence),200,50,0.8437959183673469,0.8410816326530612
184,Anchor Points,200,50,0.9100408163265307,0.9066122448979592
185,tinyBenchmarks,200,50,0.8621551020408164,0.8573714285714286
186,Random (uniform),200,100,0.8804244897959184,0.8747265306122449
187,"Random (subtask stratified, equal)",200,100,0.8800163265306122,0.8752
188,Diversity,200,100,0.8640408163265306,0.8575306122448979
189,Stratified sampling (confidence),200,100,0.8841224489795918,0.8799183673469387
190,Anchor Points,200,100,0.9218938775510204,0.918465306122449
191,tinyBenchmarks,200,100,0.9009632653061225,0.8952816326530613
192,Random (uniform),200,250,0.9253877551020409,0.9157061224489796
193,"Random (subtask stratified, equal)",200,250,0.9214367346938775,0.912604081632653
194,Diversity,200,250,0.9105510204081633,0.9052448979591837
195,Stratified sampling (confidence),200,250,0.9304081632653062,0.9254081632653062
196,Anchor Points,200,250,0.9311836734693878,0.9268734693877551
197,tinyBenchmarks,200,250,0.9367836734693877,0.9284408163265306
198,Random (uniform),200,500,0.9450612244897959,0.9357551020408164
199,"Random (subtask stratified, equal)",200,500,0.9473632653061225,0.9364571428571429
200,Diversity,200,500,0.9345102040816327,0.9266530612244898
201,Stratified sampling (confidence),200,500,0.950469387755102,0.9421224489795919
202,Anchor Points,200,500,0.9330448979591837,0.928734693877551
203,tinyBenchmarks,200,500,0.9540897959183674,0.9416326530612245
204,Random (uniform),200,1000,0.9656,0.9511836734693877
205,"Random (subtask stratified, equal)",200,1000,0.9661551020408163,0.9505959183673469
206,Diversity,200,1000,0.9523469387755102,0.9410408163265306
207,Stratified sampling (confidence),200,1000,0.9667346938775511,0.9520612244897959
208,Anchor Points,200,1000,0.9350367346938776,0.9300081632653061
209,tinyBenchmarks,200,1000,0.9678530612244898,0.9512163265306123
210,Random (uniform),250,10,0.6434122448979592,0.6406693877551021
211,"Random (subtask stratified, equal)",250,10,0.6356081632653061,0.6321632653061224
212,Diversity,250,10,0.646469387755102,0.6439183673469387
213,Stratified sampling (confidence),250,10,0.717204081632653,0.7156530612244898
214,Anchor Points,250,10,0.8676734693877551,0.867265306122449
215,tinyBenchmarks,250,10,0.7200979591836735,0.7170938775510204
216,Random (uniform),250,25,0.7650285714285714,0.7635428571428572
217,"Random (subtask stratified, equal)",250,25,0.7578285714285714,0.7562122448979591
218,Diversity,250,25,0.7541428571428571,0.7500816326530613
219,Stratified sampling (confidence),250,25,0.803795918367347,0.8028367346938775
220,Anchor Points,250,25,0.8922122448979591,0.8929469387755102
221,tinyBenchmarks,250,25,0.8124081632653061,0.8101387755102041
222,Random (uniform),250,50,0.8300897959183674,0.8257142857142857
223,"Random (subtask stratified, equal)",250,50,0.8340408163265306,0.8330448979591837
224,Diversity,250,50,0.8193061224489796,0.8134489795918367
225,Stratified sampling (confidence),250,50,0.8543469387755102,0.8525510204081632
226,Anchor Points,250,50,0.9119020408163265,0.9119510204081632
227,tinyBenchmarks,250,50,0.859069387755102,0.8547918367346938
228,Random (uniform),250,100,0.8814857142857143,0.8767673469387756
229,"Random (subtask stratified, equal)",250,100,0.8761469387755102,0.8709224489795918
230,Diversity,250,100,0.8661224489795918,0.8619591836734694
231,Stratified sampling (confidence),250,100,0.8873265306122449,0.8837142857142857
232,Anchor Points,250,100,0.9224,0.921338775510204
233,tinyBenchmarks,250,100,0.8980571428571429,0.8931265306122449
234,Random (uniform),250,250,0.9235102040816326,0.9159673469387755
235,"Random (subtask stratified, equal)",250,250,0.920065306122449,0.9138122448979592
236,Diversity,250,250,0.9101224489795918,0.9036326530612245
237,Stratified sampling (confidence),250,250,0.9258775510204081,0.920265306122449
238,Anchor Points,250,250,0.9346448979591837,0.931461224489796
239,tinyBenchmarks,250,250,0.9381224489795918,0.9286040816326531
240,Random (uniform),250,500,0.9468734693877551,0.9363918367346938
241,"Random (subtask stratified, equal)",250,500,0.9490285714285714,0.9392163265306123
242,Diversity,250,500,0.9331632653061225,0.9241632653061225
243,Stratified sampling (confidence),250,500,0.9485510204081633,0.938204081632653
244,Anchor Points,250,500,0.9360979591836734,0.9336326530612244
245,tinyBenchmarks,250,500,0.9548897959183673,0.940734693877551
246,Random (uniform),250,1000,0.967134693877551,0.9514775510204082
247,"Random (subtask stratified, equal)",250,1000,0.9642122448979592,0.9503673469387756
248,Diversity,250,1000,0.9495714285714286,0.9388163265306122
249,Stratified sampling (confidence),250,1000,0.9661020408163266,0.9496734693877551
250,Anchor Points,250,1000,0.9374530612244898,0.9349551020408163
251,tinyBenchmarks,250,1000,0.9688326530612245,0.9532244897959183
252,Random (uniform),300,10,0.635934693877551,0.6349224489795918
253,"Random (subtask stratified, equal)",300,10,0.6335836734693877,0.6312163265306122
254,Diversity,300,10,0.641795918367347,0.6389591836734694
255,Stratified sampling (confidence),300,10,0.7065714285714285,0.7029591836734694
256,Anchor Points,300,10,0.8663836734693877,0.8668571428571429
257,tinyBenchmarks,300,10,0.7266285714285714,0.7256
258,Random (uniform),300,25,0.7518367346938776,0.7510530612244898
259,"Random (subtask stratified, equal)",300,25,0.7596081632653061,0.7577632653061225
260,Diversity,300,25,0.7499591836734694,0.7475918367346939
261,Stratified sampling (confidence),300,25,0.8048979591836735,0.8053877551020409
262,Anchor Points,300,25,0.8952979591836735,0.8940734693877551
263,tinyBenchmarks,300,25,0.8054530612244898,0.8024489795918367
264,Random (uniform),300,50,0.8300897959183674,0.8275102040816327
265,"Random (subtask stratified, equal)",300,50,0.8281142857142857,0.8260081632653061
266,Diversity,300,50,0.8209183673469388,0.8180816326530612
267,Stratified sampling (confidence),300,50,0.8554489795918367,0.8523673469387755
268,Anchor Points,300,50,0.9101714285714285,0.9075102040816326
269,tinyBenchmarks,300,50,0.8621387755102041,0.8584979591836734
270,Random (uniform),300,100,0.8764408163265306,0.8746938775510205
271,"Random (subtask stratified, equal)",300,100,0.8772081632653062,0.8725877551020408
272,Diversity,300,100,0.8757959183673469,0.8713673469387755
273,Stratified sampling (confidence),300,100,0.8885918367346939,0.8859795918367347
274,Anchor Points,300,100,0.9266122448979592,0.9219265306122449
275,tinyBenchmarks,300,100,0.9021224489795918,0.8967836734693878
276,Random (uniform),300,250,0.9253877551020409,0.9175020408163266
277,"Random (subtask stratified, equal)",300,250,0.9234775510204082,0.919069387755102
278,Diversity,300,250,0.9159795918367347,0.9102857142857143
279,Stratified sampling (confidence),300,250,0.9294897959183673,0.9223469387755102
280,Anchor Points,300,250,0.9339102040816326,0.9282448979591836
281,tinyBenchmarks,300,250,0.9366204081632653,0.9281142857142857
282,Random (uniform),300,500,0.9469714285714286,0.9376326530612245
283,"Random (subtask stratified, equal)",300,500,0.9458938775510204,0.9379265306122448
284,Diversity,300,500,0.9333469387755102,0.9251428571428572
285,Stratified sampling (confidence),300,500,0.9510408163265306,0.9407551020408164
286,Anchor Points,300,500,0.935134693877551,0.9294040816326531
287,tinyBenchmarks,300,500,0.9536816326530613,0.9429714285714286
288,Random (uniform),300,1000,0.9648163265306122,0.950073469387755
289,"Random (subtask stratified, equal)",300,1000,0.9642775510204081,0.9497795918367347
290,Diversity,300,1000,0.9525102040816327,0.9413877551020409
291,Stratified sampling (confidence),300,1000,0.9691224489795919,0.9552448979591837
292,Anchor Points,300,1000,0.9369306122448979,0.9308081632653061
293,tinyBenchmarks,300,1000,0.9664979591836734,0.9523918367346939
