Model,Dimension (D),Num Tokens,d/D @ 50%,d @ 50%,d/D @ 60%,d @ 60%,d/D @ 70%,d @ 70%,d/D @ 80%,d @ 80%,d/D @ 90%,d @ 90%
ViT-Tiny,192,196000,0.505208,97,0.604167,116,0.703125,135,0.796875,153,0.901042,173
CaiT-S24,384,196000,0.500000,192,0.598958,230,0.703125,270,0.804688,309,0.901042,346
DeiT-Small,384,196000,0.502604,193,0.601562,231,0.700521,269,0.796875,306,0.901042,346
ViT-Large,1024,196000,0.500000,512,0.598633,613,0.700195,717,0.800781,820,0.899414,921
ViT-Huge,1280,256000,0.493750,632,0.592969,759,0.694531,889,0.800000,1024,0.900781,1153
Swin-Small,768,49000,0.501302,385,0.598958,460,0.700521,538,0.799479,614,0.901042,692
"ViT-Base (CLIP, OpenAI)",768,196000,0.500000,384,0.596354,458,0.697917,536,0.804688,618,0.901042,692
"ViT-Large (CLIP, OpenAI)",1024,256000,0.499023,511,0.601562,616,0.696289,713,0.801758,821,0.900391,922
ViT-Base (DINOv2),768,256000,0.500000,384,0.600260,461,0.701823,539,0.802083,616,0.899740,691
ViT-Large (DINOv2),1024,256000,0.497070,509,0.599609,614,0.699219,716,0.798828,818,0.899414,921
ViT-Base (DINO),768,196000,0.496094,381,0.597656,459,0.700521,538,0.798177,613,0.901042,692
ViT-Small (DINO),384,196000,0.476562,183,0.583333,224,0.690104,265,0.791667,304,0.895833,344
ViT-Base (MAE),768,196,0.493490,379,0.588542,452,0.684896,526,0.789062,606,0.895833,688
ViT-Large (MAE),1024,196000,0.500000,512,0.596680,611,0.697266,714,0.797852,817,0.900391,922
