Language,GPT-2,r50k_base,p50k_base,p50k_edit,cl100k_base,RoBERTa,GottBERT,CamemBERT,PhoBERT,RoCBert,XLM-RoBERTa,M2M100,MBart50,mT5,FlanT5,ByT5,CANINE,BLOOM,ArabicBERT,MuRIL,UTF-32,BERT Japanese
Acehnese (Arabic script),0,0,0,0,0,33,51,72412,44386,58680,8402,8708,8402,2548,72462,51,29,18,10234,31525,0,48267
Acehnese (Latin script),0,0,0,0,0,1,1,767,613,0,15,15,14,14,260,4,4,1,0,0,0,0
Mesopotamian Arabic,0,0,0,0,0,9,16,62312,25190,56858,160,185,159,194,62345,16,9,2,0,0,0,40926
Ta’izzi-Adeni Arabic,0,0,0,0,0,7,12,63688,25934,57505,13,15,12,15,63722,12,7,1,0,0,0,41905
Tunisian Arabic,0,0,0,0,0,25,46,62403,25404,56554,84,95,83,99,62441,46,26,7,0,0,0,41113
Afrikaans,0,0,0,0,0,0,0,21,425,52,0,0,0,0,184,2,2,0,0,0,0,1902
South Levantine Arabic,0,0,0,0,0,27,49,61432,22812,54870,13,15,13,16,61495,50,28,7,0,0,0,41268
Akan,0,0,0,0,0,1,1,11077,11553,39854,1863,2245,1863,0,14457,3,3,1,34973,28425,0,8129
Tosk Albanian,0,0,0,0,0,4,4,22,46,0,8,8,7,9,13613,9,9,3,0,0,0,43191
Amharic,0,0,0,0,0,4,4,54244,133564,39797,0,0,0,0,54251,5,2,3,38470,38198,0,35237
North Levantine Arabic,0,0,0,0,0,6,12,59206,21973,54205,5,6,5,6,59261,12,7,1,0,0,0,38713
Standard Arabic,0,0,0,0,0,7,12,64860,27130,58231,11,13,11,13,64893,12,7,1,0,0,0,41914
Standard Arabic (Romanized),0,0,0,0,0,6,6,153,289,0,107,111,106,105,182,14,14,5,0,0,0,0
Najdi Arabic,0,0,0,0,0,6,10,65159,27035,58338,3,3,2,3,65195,10,6,1,0,0,0,42310
Moroccan Arabic,0,0,0,0,0,16,30,63085,24299,56753,7,8,6,7,63119,30,17,5,0,0,0,42240
Egyptian Arabic,0,0,0,0,0,24,44,64312,21942,57565,62,73,62,74,64321,45,25,6,0,0,0,42596
Assamese,0,0,0,0,0,72,92,67224,203690,44736,0,10599,0,0,67220,92,35,10,44032,0,0,41991
Asturian,0,0,0,0,0,1,1,2330,744,16,161,155,161,178,1195,3,3,0,0,0,0,0
Awadhi,0,0,0,0,0,76,130,80663,102099,55281,84,133,84,109,80692,130,51,15,55634,0,0,51847
Central Aymara,0,0,0,0,0,3,3,2188,764,4028,0,0,0,0,1870,8,8,3,0,2708,0,1372
South Azerbaijani,0,0,0,0,0,25,40,59815,21286,49334,58,77,58,63,59832,40,22,9,422,327,0,53753
North Azerbaijani,0,0,0,0,0,0,0,24740,260,37378,24,30,24,31,23234,0,0,0,0,18644,0,27247
Bashkir,0,0,0,0,0,6,5,91578,41282,65009,126,18,126,24,62082,9,5,3,63661,57054,0,40517
Bambara,0,0,0,0,0,10,10,11132,5869,34610,495,290,494,273,14065,19,18,7,29938,25704,0,10326
Balinese,0,0,0,0,0,2,2,99,111,0,61,64,61,66,111,7,7,1,0,0,0,0
Belarusian,0,0,0,0,0,1,1,115654,7287,28620,11,19,11,13,70749,1,1,0,0,68541,0,48756
Bemba,0,0,0,0,0,2,2,40,99,0,17,25,17,16,41,6,6,1,0,0,0,0
Bengali,0,0,0,0,0,41,55,66457,209756,43950,0,0,0,0,66463,55,21,5,43201,0,0,40798
Bhojpuri,0,0,0,0,0,22,37,82006,106412,55561,0,0,0,0,81988,38,15,4,53363,0,0,53619
Banjar (Arabic script),0,0,0,0,0,16,27,68263,33614,61564,5449,5810,5449,798,68380,27,15,8,3116,29477,0,43573
Banjar (Latin script),0,0,0,0,0,0,0,25,83,0,9,9,9,9,22,1,1,0,0,0,0,0
Standard Tibetan,0,0,0,0,0,10,11,9676,46457,75232,38548,9620,38549,1013,9663,11,4,4,145917,74732,0,191521
Bosnian,0,0,0,0,0,4,4,3009,98,0,17,20,17,22,3570,11,11,4,0,11238,0,9420
Buginese,0,0,0,0,0,25,25,173,301,0,124,143,124,130,209,61,60,19,0,0,0,702
Bulgarian,0,0,0,0,0,0,0,104190,360,25783,0,0,0,0,28435,0,0,0,0,52600,0,47522
Catalan,0,0,0,0,0,1,1,945,94,0,8,8,8,9,739,4,4,0,0,1167,0,2482
Cebuano,0,0,0,0,0,0,0,15,44,0,0,18,0,0,9,2,2,0,0,0,0,0
Czech,0,0,0,0,0,1,1,13385,422,0,3,3,3,3,13430,2,2,0,0,29227,0,33564
Chokwe,0,0,0,0,0,1,1,158,110,0,6,7,6,6,92,4,4,1,0,0,0,0
Central Kurdish,0,0,0,0,0,8,10,66162,71597,44196,15,22,14,12,66160,10,6,4,8747,42684,0,40565
Crimean Tatar,0,0,0,0,0,1,1,12264,2340,47102,291,311,291,308,10569,3,3,1,0,17552,0,25277
Welsh,0,0,0,0,0,0,0,102,237,0,9,11,8,11,152,1,1,0,0,0,0,672
Danish,0,0,0,0,0,1,1,2633,314,0,180,197,180,207,3068,4,4,1,0,0,0,11963
German,0,0,0,0,0,2,1,1824,54,0,4,5,4,5,21,8,8,2,0,939,0,893
Southwestern Dinka,0,0,0,0,0,24,23,10818,2749,13902,335,1664,335,328,15436,46,41,17,20427,22162,0,22574
Dyula,0,0,0,0,0,7,8,355,271,837,8,13,7,8,456,19,18,6,815,771,0,729
Dzongkha,0,0,0,0,0,0,0,25862,49382,83470,52752,25939,52753,1520,25867,0,0,0,162528,83445,0,67675
Greek,0,0,0,0,0,3,3,81304,17717,13169,125,145,124,155,81369,5,3,1,0,56654,0,66726
English,0,0,0,0,0,0,0,13,25,0,0,142,0,0,5,3,3,0,0,0,0,0
Esperanto,0,0,0,0,0,0,0,1931,2016,0,0,176,0,0,2256,2,2,0,0,10011,0,13078
Estonian,0,0,0,0,0,2,2,3310,57,0,4,4,3,4,1500,5,5,1,0,7388,0,12244
Basque,0,0,0,0,0,0,0,35,118,0,10,11,10,11,31,0,0,0,0,0,0,0
Ewe,0,0,0,0,0,6,6,13089,9286,34818,225,896,225,131,15956,10,10,4,33260,30372,0,22175
Faroese,0,0,0,0,0,0,0,9856,2326,33540,19,20,19,20,8865,1,1,0,0,18629,0,30261
Fijian,0,0,0,0,0,1,2,13,51,0,1,21,1,1,10,5,5,1,0,0,0,0
Finnish,0,0,0,0,0,0,0,4881,55,0,14,16,14,15,59,0,0,0,0,0,0,0
Fon,0,0,0,0,0,34,35,35697,20951,47668,3488,3617,3488,3472,40964,53,43,19,48264,48699,0,40399
French,0,0,0,0,0,3,3,23,327,0,18,19,17,21,50,9,9,1,0,0,0,5586
Friulian,0,0,0,0,0,1,1,147,247,0,14,14,14,15,167,4,4,1,0,3654,0,6678
Nigerian Fulfulde,0,0,0,0,0,30,31,1945,2012,14031,41,25,41,25,2327,72,71,25,7815,5807,0,205
West Central Oromo,0,0,0,0,0,25,26,35,969,0,19,19,19,20,44,60,60,22,0,0,0,0
Scottish Gaelic,0,0,0,0,0,1,1,1313,408,0,28,36,27,32,1701,4,4,1,0,6632,0,10296
Irish,0,0,0,0,0,0,0,7182,67,0,12,13,12,15,4695,2,2,0,0,0,0,3291
Galician,0,0,0,0,0,0,0,2185,32,0,0,0,0,0,1157,1,1,0,0,0,0,807
Guarani,0,0,0,0,0,5,6,6125,1107,0,171,173,171,178,5692,12,12,4,0,8640,0,18639
Gujarati,0,0,0,0,0,57,57,71251,198466,46246,68,85,68,91,71234,57,22,6,45433,0,0,45108
Haitian Creole,0,0,0,0,0,3,4,839,62,0,23,27,23,22,1059,9,9,3,0,3648,0,5005
Hausa,0,0,0,0,0,3,3,762,843,7976,4,2,4,2,968,9,9,3,4053,3017,0,2286
Hebrew,0,0,0,0,0,2,3,59590,46038,40670,15,17,14,17,59587,3,2,1,0,38960,0,38802
Hindi,0,0,0,0,0,22,38,82824,108675,55619,0,0,0,0,82837,38,15,3,54800,0,0,53644
Chhattisgarhi,0,0,0,0,0,15,25,79961,108976,55671,2,2,2,2,80154,25,10,3,53206,0,0,52079
Croatian,0,0,0,0,0,2,2,3113,275,0,114,127,114,149,3793,6,6,2,0,11260,0,9217
Hungarian,0,0,0,0,0,1,1,10008,334,0,23,27,23,27,2980,3,3,1,0,8711,0,19524
Armenian,0,0,0,0,0,0,0,68871,205568,45044,0,0,0,0,68876,0,0,0,43896,43697,0,42716
Igbo,0,0,0,0,0,9,9,13002,536,0,85,72,85,76,16823,16,14,4,0,28544,0,36136
Ilocano,0,0,0,0,0,7,7,37,61,0,15,14,15,16,40,19,19,6,0,0,0,0
Indonesian,0,0,0,0,0,1,1,88,105,0,35,39,35,44,119,5,5,0,0,0,0,0
Icelandic,0,0,0,0,0,5,5,13802,4095,45879,14,15,13,15,11983,12,11,4,6810,26329,0,39261
Italian,0,0,0,0,0,1,1,107,53,0,0,0,0,0,116,4,4,1,0,406,0,1207
Javanese,0,0,0,0,0,0,0,12,35,0,0,0,0,0,6,2,2,0,0,0,0,0
Japanese,0,0,0,0,0,1,2,7391,16460,0,0,30,0,0,7358,2,1,0,2547,60534,0,0
Kabyle,0,0,0,0,0,20,21,5714,3305,15304,246,391,246,39,7353,42,40,16,9709,20545,0,16668
Jingpho,0,0,0,0,0,0,0,481,433,0,384,373,383,390,659,2,2,0,0,0,0,0
Kamba,0,0,0,0,0,0,0,4319,139,0,0,14,0,0,5671,0,0,0,0,14365,0,20215
Kannada,0,0,0,0,0,103,104,60069,229800,36999,512,630,512,598,60063,105,39,9,35957,299,0,37664
Kashmiri (Arabic script),0,0,0,0,0,2,3,72968,83788,55976,2021,6281,2021,485,72969,3,2,0,11782,0,0,45907
Kashmiri (Devanagari script),0,0,0,0,0,106,177,74882,104264,56977,0,0,0,0,75039,179,72,28,54201,0,0,51052
Georgian,0,0,0,0,0,10,10,63938,188128,41733,1,6,0,1,63848,10,4,3,40021,39756,0,39922
Kazakh,0,0,0,0,0,1,1,94462,21403,65826,21,25,21,24,58859,1,1,0,58382,58604,0,38720
Kabiyè,0,0,0,0,0,9,9,45664,47529,72300,488,292,487,251,56029,12,10,6,56360,49692,0,37505
Kabuverdianu,0,0,0,0,0,0,0,1004,73,0,17,19,16,17,500,1,1,0,0,0,0,2279
Halh Mongolian,0,0,0,0,0,0,0,102653,13781,57071,1,2,1,1,71186,0,0,0,34951,66188,0,42349
Khmer,0,0,0,0,0,0,0,51236,153846,24820,543,698,543,529,51373,0,0,0,18796,16670,0,90387
Kikuyu,0,0,0,0,0,2,3,17350,234,0,173,173,173,179,22134,5,5,2,0,39484,0,51995
Kinyarwanda,0,0,0,0,0,7,7,45,1370,0,25,25,24,24,48,17,17,4,0,0,0,0
Kyrgyz,0,0,0,0,0,1,1,96839,15841,37063,9,29,8,11,50128,1,1,0,29215,63920,0,39173
Kimbundu,0,0,0,0,0,1,1,125,113,0,2,6,1,1,92,3,3,1,0,0,0,0
Northern Kurdish,0,0,0,0,0,3,4,1231,4537,0,4,6,4,5,113,8,8,3,0,27333,0,43682
Central Kanuri (Arabic script),0,0,0,0,0,99,163,60221,74045,52348,102,107,102,93,60184,165,91,44,16219,0,0,38521
Central Kanuri (Latin script),0,0,0,0,0,3,3,6780,5699,41760,23,23,22,22,8614,7,7,2,26356,19662,0,21756
Kikongo,0,0,0,0,0,0,0,36,51,0,23,22,22,23,50,2,2,0,0,0,0,0
Korean,0,0,0,0,0,2,2,47471,59209,0,12,43,12,11,47473,2,1,1,0,33662,0,33935
Lao,0,0,0,0,0,51,51,25699,142816,26844,0,0,0,0,25644,52,19,34,19870,17260,0,95049
Ligurian,0,0,0,0,0,2,2,2096,1183,0,13,13,13,14,2512,5,5,1,0,3888,0,15071
Limburgish,0,0,0,0,0,2,1,697,1035,1033,17,17,16,17,232,5,5,1,0,0,0,2182
Lingala,0,0,0,0,0,1,1,16,19,0,0,0,0,0,20,3,3,0,0,0,0,0
Lithuanian,0,0,0,0,0,1,1,7668,3578,0,1,3,1,1,9106,3,3,1,0,26564,0,33236
Lombard,0,0,0,0,0,1,1,2395,1617,1941,13,12,12,14,1915,3,3,1,0,9517,0,14334
Latgalian,0,0,0,0,0,1,2,7973,1283,0,35,36,35,36,9574,4,4,1,0,11694,0,14664
Luxembourgish,0,0,0,0,0,0,0,897,61,0,0,0,0,0,1025,2,2,0,0,0,0,8436
Luba-Kasai,0,0,0,0,0,0,0,9,127,0,0,0,0,0,5,2,2,0,0,0,0,0
Ganda,0,0,0,0,0,17,17,48,627,0,27,27,26,26,53,40,40,13,0,0,0,0
Luo,0,0,0,0,0,10,10,20,54,0,8,8,7,7,19,26,26,8,0,0,0,0
Mizo,0,0,0,0,0,8,9,237,222,0,163,164,163,171,306,22,22,7,0,0,0,186
Standard Latvian,0,0,0,0,0,0,0,12197,1319,0,2,3,2,2,14538,1,1,0,0,20741,0,14865
Magahi,0,0,0,0,0,21,35,79528,110755,54316,0,0,0,0,79554,35,14,4,52081,0,0,51200
Maithili,0,0,0,0,0,6,10,78666,114079,53664,0,0,0,0,78660,10,4,1,52602,0,0,50323
Malayalam,0,0,0,0,0,40,40,57395,254044,35594,124,158,124,135,57386,41,15,3,34545,0,0,35631
Marathi,0,0,0,0,0,14,23,66585,100140,42219,165,199,164,227,66593,23,9,2,42583,0,0,41200
Minangkabau (Arabic script),0,0,0,0,0,4,7,69823,49414,61401,4707,4908,4707,346,69859,7,4,2,963,31231,0,44671
Minangkabau (Latin script),0,0,0,0,0,1,1,30,51,0,10,10,10,10,27,3,3,0,0,0,0,0
Macedonian,0,0,0,0,0,7,7,106577,2710,27937,11,12,10,13,24790,12,7,3,27239,55119,0,46684
Maltese,0,0,0,0,0,1,1,5297,4516,15435,2,49,2,2,6513,3,3,1,7981,18563,0,24489
Meitei (Bengali script),0,0,0,0,0,14,18,66052,223058,43614,0,0,0,0,66034,18,7,3,42924,0,0,40692
Mossi,0,0,0,0,0,24,24,8158,3034,13643,114,122,113,126,11292,48,45,19,8472,17764,0,22703
Maori,0,0,0,0,0,2,2,6818,83,0,36,35,35,35,9585,6,6,2,0,4298,0,3497
Burmese,0,0,0,0,0,0,0,39357,292405,29241,28,55,27,27,39352,0,0,0,27679,27130,0,34767
Dutch,0,0,0,0,0,10,9,49,41,0,17,19,17,19,143,28,28,8,0,0,0,675
Norwegian Nynorsk,0,0,0,0,0,0,0,2318,54,0,12,13,12,13,2717,1,1,0,0,0,0,7667
Norwegian Bokmål,0,0,0,0,0,1,1,2216,28,0,2,2,2,2,2607,5,5,1,0,0,0,7948
Nepali,0,0,0,0,0,3,5,62802,93877,42607,5,6,5,7,62797,5,2,0,41537,0,0,38843
Northern Sotho,0,0,0,0,0,2,2,3089,57,0,10,9,9,9,3943,5,5,1,0,0,0,411
Nuer,0,0,0,0,0,39,39,36430,28868,57701,797,862,796,602,39144,61,50,26,46217,52527,0,31296
Nyanja,0,0,0,0,0,25,26,64,117,0,38,39,38,35,72,62,62,20,0,0,0,0
Occitan,0,0,0,0,0,1,1,999,350,0,0,0,0,0,994,3,3,0,0,3398,0,5508
Odia,0,0,0,0,0,44,45,67173,219747,44066,0,0,0,0,67190,45,17,4,42994,0,0,41732
Pangasinan,0,0,0,0,0,3,4,37,44,0,18,18,17,18,39,11,11,3,0,0,0,0
Eastern Panjabi,0,0,0,0,0,12,20,82639,203489,56972,0,0,0,0,82645,20,8,2,55584,0,0,53497
Papiamento,0,0,0,0,0,0,0,1883,107,0,10,25,9,10,1069,1,1,0,0,1131,0,2248
Southern Pashto,0,0,0,0,0,113,170,81700,43535,62110,36,42,35,47,81818,172,99,54,28255,25594,0,55616
Western Persian,0,0,0,0,0,6,10,78651,29308,59368,29,32,28,38,78701,10,6,2,255,126,0,55392
Plateau Malagasy,0,0,0,0,0,8,8,36,1598,0,7,9,6,7,35,19,19,6,0,0,0,0
Polish,0,0,0,0,0,0,0,8171,1085,20592,0,10,0,0,8271,0,0,0,0,25030,0,30679
Portuguese,0,0,0,0,0,2,2,1780,97,0,42,46,42,53,1462,6,6,1,0,863,0,9395
Dari,0,0,0,0,0,3,5,76366,26408,59780,24,30,23,31,76384,5,3,1,0,0,0,50074
Ayacucho Quechua,0,0,0,0,0,3,3,636,58,0,1,1,1,1,628,8,8,2,0,0,0,1293
Romanian,0,0,0,0,0,0,0,5123,74,0,23,26,23,28,38,2,2,0,0,24407,0,31186
Rundi,0,0,0,0,0,1,1,23,384,912,0,0,0,0,18,3,3,0,0,0,0,0
Russian,0,0,0,0,0,5,5,107196,386,20500,14,15,14,16,38258,9,5,2,0,59432,0,44800
Sango,0,0,0,0,0,16,17,755,252,0,30,29,29,32,619,41,40,13,0,796,0,4513
Sanskrit,0,0,0,0,0,29,48,58919,97112,39209,100,150,100,127,58912,48,18,6,37868,0,0,36299
Santali,0,0,0,0,0,19,19,80325,223923,52093,80318,80306,80319,111559,80357,21,8,19,51985,51956,0,50203
Sicilian,0,0,0,0,0,4,4,1283,1473,0,5,10,5,5,1597,10,10,3,0,9170,0,15001
Shan,0,0,0,0,0,0,0,37045,310571,38963,193,216,193,157,36568,0,0,0,28878,24948,0,83618
Sinhala,0,0,0,0,0,12,13,74983,210289,46130,52,66,52,70,74987,13,5,8,44954,44781,0,50033
Slovak,0,0,0,0,0,2,2,9990,304,0,1,1,1,1,9525,4,4,1,0,24351,0,27466
Slovenian,0,0,0,0,0,3,3,2613,33,0,2,2,2,2,3158,7,7,2,0,11701,0,7680
Samoan,0,0,0,0,0,3,3,944,2471,2385,20,20,20,22,1284,8,8,3,0,0,0,0
Shona,0,0,0,0,0,4,4,25,75,0,13,14,13,12,26,10,10,3,0,0,0,0
Sindhi,0,0,0,0,0,5,8,78272,50004,63856,4,4,3,5,78287,8,5,2,21113,0,0,51693
Somali,0,0,0,0,0,8,9,20,66,0,7,7,7,8,19,21,21,7,0,0,0,0
Southern Sotho,0,0,0,0,0,2,2,39,95,0,18,17,18,17,39,7,7,2,0,0,0,0
Spanish,0,0,0,0,0,0,0,1850,57,0,19,20,19,23,878,0,0,0,0,0,0,532
Sardinian,0,0,0,0,0,1,1,634,732,0,14,14,14,15,790,3,3,0,0,4031,0,7013
Serbian,0,0,0,0,0,3,3,100697,4561,46346,14,16,14,17,30038,5,3,1,44212,59356,0,44880
Swati,0,0,0,0,0,1,1,34,58,0,18,34,18,17,41,3,3,0,0,0,0,0
Sundanese,0,0,0,0,0,4,4,36,52,0,16,16,15,17,35,12,12,3,0,0,0,0
Swedish,0,0,0,0,0,2,2,4501,72,0,24,26,23,27,1594,7,7,2,0,0,0,10740
Swahili,0,0,0,0,0,2,3,5,53,0,0,1,0,0,1,7,7,1,0,0,0,0
Silesian,0,0,0,0,0,0,0,6967,70,16664,5,47,5,5,8456,1,1,0,0,12884,0,21011
Tamil,0,0,0,0,0,54,54,62397,258155,39576,65,80,64,66,62383,54,20,4,38399,0,0,37981
Tamasheq (Latin script),0,0,0,0,0,186,189,7770,5296,26225,392,744,392,256,6890,389,365,149,15623,21863,0,24072
Tamasheq (Tifinagh script),0,0,0,0,0,803,804,86417,172810,67294,86323,86062,86324,18297,72463,869,358,603,43930,65052,0,65454
Tatar,0,0,0,0,0,1,1,91462,24841,60573,22,53,22,1,54987,1,1,0,58319,64804,0,40483
Telugu,0,0,0,0,0,70,71,61719,213152,40698,174,72325,174,203,61655,71,27,7,38692,310,0,39309
Tajik,0,0,0,0,0,2,2,119854,14972,53661,792,2330,792,8,39298,3,2,1,11361,68662,0,48660
Tagalog,0,0,0,0,0,1,1,334,326,0,202,222,201,226,419,5,5,1,0,0,0,0
Thai,0,0,0,0,0,1,2,16433,7198,14188,0,0,0,0,16437,2,1,0,18246,10177,0,114630
Tigrinya,0,0,0,0,0,11,11,59659,136081,43361,11,180,11,3,59664,12,5,7,42306,42187,0,39215
Tok Pisin,0,0,0,0,0,164,173,206,204,522,145,148,145,153,237,469,469,144,191,156,0,181
Tswana,0,0,0,0,0,1,2,26,58,0,2,7,2,2,25,5,5,1,0,0,0,0
Tsonga,0,0,0,0,0,2,2,36,332,0,17,19,17,17,39,6,6,2,0,0,0,0
Turkmen,0,0,0,0,0,1,1,12894,44,0,2,38,2,2,7913,3,3,1,0,33971,0,44029
Tumbuka,0,0,0,0,0,7,8,1885,1779,0,16,17,16,15,2412,18,18,6,0,11741,0,16654
Turkish,0,0,0,0,0,1,1,10387,135,43711,12,14,12,14,7381,3,3,1,0,17744,0,26381
Twi,0,0,0,0,0,17,18,9172,7449,31161,145,155,145,34,11976,35,33,12,29610,23680,0,6265
Central Atlas Tamazight,0,0,0,0,0,44,44,73496,179054,48970,73394,73366,73394,76,73503,48,19,33,44801,47591,0,47613
Uyghur,0,0,0,0,0,5,7,62341,78689,43735,3,11832,3,6,62322,7,4,2,37244,51973,0,38186
Ukrainian,0,0,0,0,0,3,3,101271,4615,24072,33,38,33,40,48721,5,3,1,0,63694,0,43662
Umbundu,0,0,0,0,0,16,17,1318,1114,0,12,14,11,12,1674,39,38,13,0,2146,0,7131
Urdu,0,0,0,0,0,1,1,84554,69318,64423,0,3,0,0,84601,1,1,0,0,0,0,56167
Northern Uzbek,0,0,0,0,0,0,0,6,46,0,0,0,0,0,8,2,2,0,0,0,0,0
Venetian,0,0,0,0,0,2,2,2340,602,20799,15,21,14,16,2689,6,6,1,0,1204,0,4073
Vietnamese,0,0,0,0,0,0,0,29900,25,0,0,0,0,0,33486,0,0,0,0,54562,0,60711
Waray,0,0,0,0,0,0,0,30,42,0,13,23,12,13,29,2,2,0,0,0,0,0
Wolof,0,0,0,0,0,3,3,1366,305,0,0,2,0,0,3148,7,7,2,0,0,0,9631
Xhosa,0,0,0,0,0,12,13,28,48,0,9,24,9,9,25,30,30,9,0,0,0,0
Eastern Yiddish,0,0,0,0,0,13,19,79226,79718,51950,124,139,123,143,79172,19,11,9,0,50451,0,50458
Yoruba,0,0,0,0,0,40,41,33312,157,8400,1793,1387,1793,1700,35824,66,50,17,4933,37923,0,50969
Yue Chinese,0,0,0,0,0,0,0,11752,28305,0,25,173,24,41,11604,0,0,0,17402,67301,0,0
Chinese (Simplified),0,0,0,0,0,0,0,14278,32640,0,0,74,0,0,14124,0,0,0,8752,68221,0,2003
Chinese (Traditional),0,0,0,0,0,0,0,12124,29301,0,31,205,30,54,12026,0,0,0,19325,68883,0,0
Standard Malay,0,0,0,0,0,2,3,33,63,0,8,10,8,10,31,8,8,1,0,0,0,0
Zulu,0,0,0,0,0,4,4,21,38,0,3,12,2,2,17,10,10,3,0,0,0,0
