diff options
Diffstat (limited to 'libtextcat/data/new_fingerprints/lm/swahili.lm')
-rw-r--r-- | libtextcat/data/new_fingerprints/lm/swahili.lm | 400 |
1 files changed, 400 insertions, 0 deletions
diff --git a/libtextcat/data/new_fingerprints/lm/swahili.lm b/libtextcat/data/new_fingerprints/lm/swahili.lm new file mode 100644 index 000000000000..56090b40153e --- /dev/null +++ b/libtextcat/data/new_fingerprints/lm/swahili.lm @@ -0,0 +1,400 @@ +_ 16483 +a 9342 +i 5293 +a_ 4071 +u 2730 +k 2609 +n 2351 +w 2076 +m 1928 +e 1866 +h 1800 +o 1775 +wa 1743 +l 1486 +s 1419 +i_ 1401 +t 1399 +_k 1306 +y 1100 +_w 969 +li 945 +wa_ 911 +z 891 +_wa 890 +ka 834 +ku 799 +r 770 +b 733 +an 727 +ma 723 +o_ 711 +_m 707 +na 698 +ya 675 +ha 672 +g 602 +al 580 +d 570 +at 560 +am 554 +_n 549 +_ku 549 +ik 543 +_h 515 +ya_ 514 +A 494 +is 487 +_y 485 +hi 474 +na_ 471 +_ya 471 +ta 468 +sh 456 +ali 449 +j 426 +u_ 423 +ki 418 +e_ 402 +p 401 +ti 401 +_wa_ 399 +f 392 +_ya_ 390 +ba 390 +ri 385 +ng 385 +il 380 +c 358 +hu 356 +_na 356 +ni 355 +za 354 +zi 351 +ia 344 +_na_ 343 +_a 336 +in 327 +_ma 326 +ch 322 +mb 317 +ika 314 +. 311 +._ 309 +_ka 307 +as 306 +ak 306 +ati 301 +, 300 +ka_ 296 +,_ 294 +_u 292 +kw 286 +ili 278 +K 274 +en 271 +si 266 +_kw 262 +la 261 +ni_ 261 +ma_ 261 +_s 258 +kwa 258 +ar 256 +ut 245 +za_ 245 +nd 242 +mba 241 +_kwa 239 +_z 234 +li_ 233 +un 233 +ny 230 +it 229 +se 229 +yo 227 +ia_ 222 +M 221 +sa 221 +kat 217 +_K 214 +_i 213 +ika_ 213 +ana 212 +ish 212 +kati 206 +_ha 204 +on 201 +ai 200 +I 198 +aa 196 +um 195 +im 190 +v 188 +mu 187 +amb 187 +sha 185 +em 183 +fa 181 +zi_ 180 +di 179 +mi 178 +_M 178 +us 176 +_ki 176 +ha_ 175 +iw 172 +ama 172 +_kat 168 +_kati 168 +_hi 166 +_l 166 +ra 166 +kwa_ 165 +la_ 164 +W 164 +ja 163 +U 163 +N 163 +amba 161 +ao 161 +_za 160 +ji 160 +B 157 +iwa 155 +tik 155 +wal 155 +le 155 +tika 154 +ge 153 +lis 153 +tu 152 +atika 152 +to 152 +atik 152 +uw 152 +_kwa_ 151 +A_ 151 +ke 150 +S 147 +tika_ 145 +aj 145 +we 144 +cha 144 +bi 141 +az 140 +er 139 +ek 138 +katik 138 +ez 138 +uwa 137 +kut 135 +_al 134 +_B 134 +ad 134 +mu_ 133 +_ali 133 +rik 132 +_W 131 +ba_ 131 +kuw 131 +me 130 +ali_ 128 +kuwa 128 +ema 127 +wan 127 +bu 126 +sem 126 +_A 125 +ir 125 +ata 125 +iz 124 +_hu 124 +ay 124 +ul 124 +af 123 +iki 122 +ema_ 121 +da 120 +ti_ 120 +sema 119 +aka 118 +sema_ 118 +te 118 +uz 117 +yo_ 117 +_v 117 +io 116 +iy 115 +uta 115 +ani 115 +_wal 115 +he 115 +if 114 +_la 114 +ab 114 +go 112 +_za_ 111 +ama_ 111 +sa_ 111 +pa 110 +_t 110 +zo 110 +nge 110 +wam 109 +wali 108 +ua 107 +ur 106 +_c 106 +ise 105 +_ch 105 +isem 105 +ho 105 +ye 104 +iyo 104 +E 104 +el 104 +mo 103 +ung 103 +eri 103 +_wali 103 +_b 102 +mba_ 102 +ari 101 +ita 101 +isema 100 +ot 99 +_la_ 99 +uk 99 +ao_ 99 +di_ 99 +sha_ 99 +ini 99 +kuwa_ 98 +uwa_ 98 +ana_ 98 +lise 98 +lisem 98 +uli 97 +shi 97 +ga 96 +iwa_ 96 +fu 96 +T 96 +R 95 +_il 95 +wak 94 +aw 94 +isha 94 +ri_ 93 +_am 93 +ara 92 +_cha 92 +aji 92 +_ili 91 +ifa 91 +O 90 +_p 90 +uh 90 +iri 90 +chi 90 +asi 89 +po 89 +a. 89 +ong 89 +azi 88 +_j 88 +_kut 88 +eny 88 +nc 88 +a._ 88 +ko 87 +uu 87 +id 87 +w_ 87 +no 87 +P 86 +ah 86 +ina 86 +rika 86 +_Bw 85 +H 85 +gu 85 +uo 85 +Bw_ 85 +_Bw_ 85 +_se 85 +Bw 85 +ib 84 +_S 84 +kam 84 +hi_ 84 +nya 84 +si_ 83 +a, 82 +no_ 81 +pi 81 +ok 81 +i. 81 +ip 81 +kwam 81 +i._ 81 +amba_ 80 +dh 80 +end 80 +ani_ 80 +a,_ 79 +wamb 79 +kwamb 79 +_sh 79 +eza 79 +nz 79 +wi 79 +_kwam 79 +wamba 79 +alis 78 +_kuw 78 +ngo 78 +ap 77 +_N 77 +any 77 +ili_ 77 +C 77 +WA 76 +vy 76 +wana 76 +_hiy 75 +Wa 75 +hiyo 75 +nch 75 +_hiyo 75 +de 75 +_kuwa 75 +ing 75 +hiy 75 +vi 75 +isha_ 74 +es 74 +atu 74 +_Wa 74 +nchi 74 +aki 74 +lim 73 +da_ 73 +ini_ 73 +ash 73 +ala 73 +i, 73 +ano 73 +i,_ 72 +_kam 71 +_wan 71 +ano_ 71 +mw 71 +nde 71 +ji_ 71 +ion 70 +_amb 70 +ndi 70 +_Ka 70 +eza_ 70 |