| Script | Count |
|---|---|
| Arabic | 32,047 |
| CJK | 352,053 |
| Cyrillic | 10,497 |
| Greek | 906 |
| Hebrew | 20,246 |
| Other | 2,109 |

| Language | Count |
|---|---|
| No linguistic content | 43 |
| ch | 1 |
| 0ch | 1 |
| a a | 2 |
| aar Afar | 1 |
| alg Algonquian (Other) | 1 |
| ara Arabic | 27,927 |
| arc Aramaic | 34 |
| arm Armenian | 4 |
| ava Avaric | 1 |
| ave Avestan | 1 |
| aze Azerbaijani | 10 |
| bak Bashkir | 1 |
| bal Baluchi | 1 |
| bel Belarusian | 42 |
| ben Bengali | 6 |
| ber Berber (Other) | 4 |
| bos Bosnian | 1 |
| bul Bulgarian | 173 |
| bur Burmese | 1 |
| cha Chamorro | 1 |
| che Chechen | 2 |
| chg Chagatai | 2 |
| chi Chinese | 160,346 |
| cho Choctaw | 4 |
| chu Church Slavic | 6 |
| chv Chuvash | 2 |
| cop Coptic | 1 |
| crh Crimean Tatar | 2 |
| cze Czech | 3 |
| dan Danish | 1 |
| dut Dutch | 12 |
| eb\| | 1 |
| egy Egyptian | 2 |
| eng English | 1,755 |
| est Estonian | 1 |
| fin Finnish | 2 |
| fiu Finno-Ugrian (Other) | 1 |
| fre French | 174 |
| geo Georgian | 6 |
| ger German | 76 |
| grc Greek, Ancient (to 1453) | 1 |
| gre Greek, Modern (1453- ) | 864 |
| heb Hebrew | 19,652 |
| hi | 2 |
| hin Hindi | 5 |
| hrv | 3 |
| ind Indonesian | 1 |
| ipk Inupiaq | 1 |
| ira Iranian (Other) | 1 |
| ita Italian | 18 |
| jav Javanese | 1 |
| jpn Japanese | 140,648 |
| jrb Judeo-Arabic | 8 |
| kaa Kara-Kalpak | 1 |
| kaz Kazakh | 9 |
| kir Kyrgyz | 4 |
| kom Komi | 1 |
| kor Korean | 48,937 |
| kur Kurdish | 13 |
| lad Ladino | 14 |
| lah Lahnda | 1 |
| lat Latin | 26 |
| mac Macedonian | 30 |
| mal Malayalam | 1 |
| man Mandingo | 1 |
| may Malay | 1 |
| mis Miscellaneous languages | 5 |
| mnc Manchu | 21 |
| mon Mongolian | 29 |
| mul Multiple languages | 101 |
| nog Nogai | 1 |
| ota Turkish, Ottoman | 34 |
| per Persian | 2,948 |
| pol Polish | 42 |
| por Portuguese | 4 |
| pus Pushto | 7 |
| raj Rajasthani | 1 |
| rum Romanian | 7 |
| rus Russian | 8,956 |
| sam Samaritan Aramaic | 13 |
| san Sanskrit | 14 |
| scc Serbian | 327 |
| scr Croatian | 6 |
| sit Sino-Tibetan (Other) | 2 |
| sla Slavic (Other) | 1 |
| snd Sindhi | 5 |
| spa Spanish | 13 |
| srp | 195 |
| swe Swedish | 1 |
| syr Syriac | 1 |
| tam Tamil | 14 |
| tat Tatar | 7 |
| tgk Tajik | 3 |
| tha Thai | 6 |
| tib Tibetan | 383 |
| tur Turkish | 16 |
| tut Altaic (Other) | 54 |
| tyv Tuvinian | 1 |
| uig Uighur | 1 |
| ukr Ukrainian | 552 |
| und Undetermined | 17 |
| urd Urdu | 1,292 |
| uzb Uzbek | 12 |
| vie Vietnamese | 2 |
| yid Yiddish | 1,718 |
| zxx No linguistic content | 26 |

| Location | Arabic | CJK | Cyrillic | Greek | Hebrew | Other |
|---|---|---|---|---|---|---|
| ACQeax | 0 | 5 | 0 | 0 | 0 | 0 |
| afst | 2 | 0 | 0 | 0 | 0 | 0 |
| ave | 73 | 208 | 37 | 2 | 31 | 1 |
| ave,anx2 | 0 | 0 | 0 | 0 | 1 | 0 |
| ave4off | 4 | 2 | 17 | 1 | 1 | 2 |
| avr | 0 | 11 | 7 | 0 | 0 | 0 |
| bar | 3 | 7 | 1 | 0 | 0 | 0 |
| bar,medi | 2 | 12 | 1 | 0 | 0 | 0 |
| bar,over | 0 | 0 | 1 | 0 | 0 | 0 |
| bmc | 9 | 73 | 3 | 0 | 1 | 3 |
| bmc,res | 29 | 212 | 13 | 0 | 7 | 3 |
| bus | 100 | 21 | 21 | 0 | 25 | 2 |
| bus4off | 2 | 1 | 1 | 0 | 0 | 0 |
| busn | 0 | 3 | 0 | 0 | 0 | 0 |
| comp | 0 | 1 | 0 | 0 | 0 | 0 |
| dis | 0 | 1 | 0 | 0 | 0 | 0 |
| docs | 0 | 1 | 0 | 0 | 0 | 0 |
| eal | 0 | 367 | 1 | 0 | 0 | 0 |
| eal,anx2 | 0 | 1 | 0 | 0 | 0 | 0 |
| eal,rare | 0 | 2 | 0 | 0 | 0 | 0 |
| eal,ref | 0 | 23 | 0 | 0 | 0 | 1 |
| eal,spec | 0 | 2 | 0 | 0 | 0 | 0 |
| eal4off | 0 | 10 | 1 | 0 | 0 | 0 |
| ean | 0 | 1 | 0 | 0 | 0 | 0 |
| eax | 0 | 163,966 | 12 | 1 | 0 | 0 |
| eax,anx2 | 0 | 603 | 0 | 0 | 0 | 0 |
| eax,cage | 0 | 15 | 0 | 0 | 0 | 0 |
| eax,fol | 0 | 12 | 0 | 0 | 0 | 0 |
| eax,rare | 0 | 1,887 | 0 | 0 | 0 | 0 |
| eax,ref | 1 | 2,526 | 1 | 0 | 0 | 0 |
| eax,ref2 | 0 | 36 | 0 | 0 | 0 | 0 |
| eax,res | 0 | 1 | 0 | 0 | 0 | 0 |
| eax,sem | 0 | 1 | 0 | 0 | 0 | 0 |
| eax,sky | 0 | 270 | 0 | 0 | 0 | 0 |
| eax,spec | 0 | 3,922 | 0 | 0 | 0 | 0 |
| eax4off | 0 | 2,126 | 0 | 0 | 0 | 1 |
| egyp | 3 | 0 | 0 | 0 | 0 | 0 |
| eng | 0 | 1 | 0 | 0 | 0 | 0 |
| eng,ref | 0 | 3 | 0 | 0 | 0 | 0 |
| far | 0 | 3 | 0 | 0 | 0 | 0 |
| far,stor | 0 | 0 | 0 | 0 | 1 | 0 |
| fax | 53 | 728 | 55 | 1 | 87 | 2 |
| fax,ref | 0 | 1 | 0 | 0 | 0 | 0 |
| fax4off | 4 | 5 | 24 | 0 | 0 | 1 |
| gax | 0 | 3 | 19 | 0 | 5 | 0 |
| glg | 2 | 3 | 0 | 0 | 1 | 0 |
| glx | 15,902 | 26 | 1,804 | 552 | 7,775 | 327 |
| glx,anx | 1 | 0 | 0 | 0 | 0 | 0 |
| glx,fol | 1 | 0 | 3 | 1 | 3 | 0 |
| glx4off | 260 | 4 | 170 | 14 | 9 | 252 |
| glxn | 22 | 0 | 34 | 1 | 0 | 0 |
| gsc | 0 | 2 | 0 | 0 | 0 | 0 |
| gsc4off | 0 | 2 | 0 | 0 | 0 | 0 |
| hsl,clncy | 0 | 12 | 1 | 0 | 2 | 0 |
| hsl,stx | 0 | 1 | 0 | 1 | 0 | 0 |
| islm | 1,085 | 1 | 0 | 0 | 4 | 1 |
| jou | 0 | 0 | 1 | 0 | 0 | 0 |
| leh | 2,869 | 10 | 282 | 2 | 813 | 65 |
| leh,atls | 0 | 0 | 1 | 0 | 0 | 0 |
| leh,ref | 5 | 0 | 0 | 0 | 0 | 0 |
| leh,tib | 0 | 10 | 0 | 0 | 0 | 0 |
| leh4off | 33 | 0 | 75 | 0 | 0 | 4 |
| lehn | 3 | 2 | 1 | 0 | 0 | 0 |
| lsp | 0 | 0 | 0 | 0 | 4 | 0 |
| lweb | 221 | 5,750 | 614 | 3 | 406 | 4 |
| lweb,docs | 2 | 2 | 1 | 3 | 0 | 0 |
| lweb,ref | 0 | 35 | 4 | 0 | 2 | 0 |
| manc | 1 | 0 | 0 | 0 | 0 | 0 |
| map | 0 | 1 | 3 | 0 | 0 | 0 |
| mat | 1 | 1 | 1 | 0 | 0 | 0 |
| mat,ser | 0 | 1 | 0 | 0 | 0 | 0 |
| mil | 3 | 4 | 1 | 0 | 5 | 1 |
| mrr | 2 | 1 | 145 | 0 | 10 | 0 |
| msc | 0 | 16 | 3 | 0 | 2 | 6 |
| msc,ref | 0 | 1 | 2 | 0 | 0 | 0 |
| msc4off | 0 | 0 | 2 | 0 | 0 | 0 |
| msr | 4 | 9 | 1 | 1 | 1 | 0 |
| msr4off | 0 | 0 | 0 | 0 | 0 | 3 |
| mus | 69 | 4 | 15 | 8 | 12 | 2 |
| mus,case | 0 | 0 | 1 | 0 | 1 | 0 |
| mus,ref | 2 | 0 | 3 | 0 | 1 | 0 |
| mus4off | 0 | 1 | 3 | 0 | 0 | 4 |
| off,ave | 94 | 88 | 256 | 22 | 76 | 7 |
| off,bio | 0 | 3 | 1 | 0 | 0 | 0 |
| off,bmc | 4 | 29 | 0 | 0 | 2 | 0 |
| off,bus | 70 | 10 | 51 | 0 | 26 | 3 |
| off,che | 0 | 3 | 1 | 0 | 0 | 0 |
| off,dic | 0 | 2 | 0 | 0 | 0 | 0 |
| off,docs | 0 | 1 | 0 | 0 | 0 | 0 |
| off,eal | 0 | 195 | 0 | 0 | 0 | 0 |
| off,ean | 0 | 2 | 0 | 0 | 0 | 0 |
| off,eax | 1 | 171,319 | 8 | 1 | 0 | 1 |
| off,eng | 1 | 1 | 1 | 0 | 0 | 0 |
| off,far | 0 | 0 | 0 | 1 | 2 | 0 |
| off,fax | 35 | 336 | 438 | 11 | 56 | 6 |
| off,glg | 1 | 1 | 12 | 0 | 4 | 0 |
| off,glx | 10,076 | 30 | 5,371 | 267 | 9,620 | 810 |
| off,gsc | 0 | 7 | 4 | 0 | 0 | 0 |
| off,hsr | 0 | 6 | 0 | 0 | 1 | 0 |
| off,jou | 0 | 0 | 1 | 0 | 0 | 0 |
| off,leh | 1,013 | 11 | 645 | 0 | 560 | 29 |
| off,les | 1 | 0 | 0 | 0 | 0 | 0 |
| off,mat | 0 | 0 | 1 | 0 | 0 | 0 |
| off,msc | 0 | 0 | 5 | 0 | 15 | 0 |
| off,mus | 26 | 3 | 86 | 1 | 20 | 2 |
| off,mvr | 0 | 1 | 0 | 0 | 0 | 0 |
| off,phy | 0 | 1 | 0 | 0 | 0 | 0 |
| off,prd | 1 | 1,168 | 1 | 0 | 2 | 0 |
| off,psy | 0 | 0 | 0 | 0 | 1 | 0 |
| off,rbx | 0 | 1 | 0 | 0 | 6 | 0 |
| off,ref | 3 | 0 | 0 | 0 | 0 | 0 |
| off,sci | 7 | 1 | 0 | 0 | 2 | 0 |
| off,swx | 0 | 1 | 0 | 0 | 10 | 0 |
| off,utmrl | 6 | 86 | 0 | 0 | 0 | 0 |
| off,utn | 6 | 2 | 4 | 0 | 5 | 1 |
| off,utp | 0 | 1 | 0 | 0 | 2 | 0 |
| off,uts | 10 | 31 | 3 | 0 | 13 | 0 |
| off,war | 0 | 0 | 0 | 0 | 2 | 0 |
| pap | 0 | 0 | 0 | 3 | 0 | 0 |
| prd | 0 | 79 | 0 | 0 | 0 | 0 |
| pren,eax | 0 | 66 | 0 | 0 | 0 | 0 |
| psy | 0 | 0 | 0 | 0 | 1 | 0 |
| rbx | 6 | 15 | 264 | 0 | 553 | 528 |
| ref | 3 | 1 | 12 | 1 | 8 | 0 |
| ref,casm | 0 | 0 | 1 | 0 | 0 | 0 |
| said | 214 | 0 | 0 | 0 | 0 | 1 |
| sho | 0 | 7 | 6 | 0 | 2 | 0 |
| swx | 0 | 2 | 0 | 0 | 2 | 0 |
| ushi | 0 | 1 | 0 | 0 | 0 | 0 |
| uts | 45 | 22 | 17 | 9 | 23 | 2 |
| uts,fil | 0 | 1 | 0 | 0 | 0 | 0 |
| uts,gil | 2 | 0 | 0 | 0 | 7 | 0 |
| uts,locxxf | 0 | 0 | 0 | 0 | 1 | 0 |
| uts,mrld | 0 | 0 | 0 | 0 | 1 | 0 |
| uts,mrlo | 0 | 42 | 0 | 0 | 0 | 0 |
| uts,mrlxxp | 0 | 10 | 0 | 0 | 0 | 0 |
| uts,per | 0 | 50 | 0 | 0 | 1 | 0 |
| uts,perxxf | 0 | 1 | 0 | 0 | 0 | 1 |
| uts,ref | 0 | 0 | 0 | 0 | 1 | 0 |
| uts,tms | 0 | 0 | 0 | 0 | 1 | 0 |
| uts,twr | 9 | 0 | 0 | 0 | 1 | 0 |
| uts,unn | 1 | 8 | 1 | 0 | 30 | 0 |
| uts,unnr | 9 | 0 | 0 | 0 | 19 | 4 |
| uts,unnrxf | 0 | 0 | 0 | 0 | 2 | 0 |
| uts4off | 1 | 0 | 0 | 1 | 0 | 0 |
| war | 0 | 1 | 1 | 0 | 1 | 0 |