diff options
Diffstat (limited to 'libtextcat/data/new_fingerprints/lm/estonian.lm')
-rw-r--r-- | libtextcat/data/new_fingerprints/lm/estonian.lm | 400 |
1 files changed, 400 insertions, 0 deletions
diff --git a/libtextcat/data/new_fingerprints/lm/estonian.lm b/libtextcat/data/new_fingerprints/lm/estonian.lm new file mode 100644 index 000000000000..74a7aa014324 --- /dev/null +++ b/libtextcat/data/new_fingerprints/lm/estonian.lm @@ -0,0 +1,400 @@ +_ 20738 +a 7004 +e 5699 +i 5321 +s 4731 +t 3769 +l 3448 +u 3446 +n 2902 +k 2584 +d 2202 +m 2043 +a_ 1758 +o 1684 +r 1429 +g 1174 +v 1151 +e_ 1139 +i_ 1136 +_k 1136 +s_ 1077 +h 1009 +, 995 +,_ 995 +_t 953 +p 953 +j 940 +ä 900 +is 896 +st 851 +se 841 +_s 822 +. 821 +as 801 +d_ 801 +le 800 +ta 794 +in 793 +_m 790 +ô 754 +._ 753 +t_ 746 +ma 710 +_p 680 +si 677 +_v 660 +es 636 +al 626 +us 619 +el 602 +_o 596 +_e 586 +ja 580 +_j 563 +te 562 +ü 549 +li 532 +va 515 +id 501 +ol 498 +tu 497 +da 490 +_n 480 +ku 478 +ud 459 +nu 455 +na 438 +ei 432 +ks 418 +mi 411 +ee 411 +u_ 407 +ka 400 +n_ 394 +b 394 +ga 386 +_l 384 +_a 380 +an 366 +ja_ 365 +et 358 +me 358 +l_ 350 +at 348 +la 341 +ad 340 +st_ 339 +ne 336 +ll 333 +_ta 332 +ra 330 +_ja 328 +ik 323 +en 318 +ni 308 +ul 305 +sa 302 +_ol 302 +nd 299 +_ja_ 299 +nud 296 +ii 291 +ko 286 +_se 285 +le_ 283 +aa 281 +is_ 281 +gi 270 +_te 269 +ag 269 +_va 268 +_ku 267 +ed 262 +em 255 +_mi 255 +ma_ 247 +ti 246 +ri 245 +_h 242 +gu 239 +id_ 238 +ast 237 +it 236 +ga_ 236 +un 232 +de 230 +ud_ 230 +ha 230 +ak 228 +ah 228 +uu 228 +il 227 +ôi 226 +as_ 223 +ke 222 +ar 220 +a, 220 +am 220 +_ko 220 +a,_ 220 +_ka 220 +ai 220 +eg 216 +sin 214 +est 214 +ui 214 +he 214 +ks_ 213 +ö 213 +oo 213 +ju 207 +är 205 +ut 203 +in_ 203 +oli 201 +ki 199 +su 199 +es_ 199 +lt 198 +ist 188 +li_ 186 +ea 186 +vi 184 +im 181 +mu 181 +se_ 180 +ts 180 +on 178 +ise 178 +ta_ 177 +ek 176 +_oli 176 +sel 173 +nud_ 173 +_ü 172 +a. 171 +nn 170 +ema 169 +ng 168 +lu 168 +ge 167 +_si 166 +_ei 165 +_i 165 +_ei_ 164 +ei_ 164 +_r 163 +ole 161 +pa 160 +lle 160 +a._ 160 +ust 159 +du 156 +er 156 +vô 153 +da_ 153 +min 152 +et_ 151 +d,_ 149 +_M 149 +ht 149 +d, 149 +M 149 +kui 148 +_et 147 +K 147 +_K 146 +pe 145 +gi_ 145 +_vô 145 +or 144 +_tu 142 +lt_ 141 +_ma 141 +asi 140 +ve 139 +us_ 138 +ig 136 +sin_ 136 +ur 135 +_ta_ 134 +di 134 +_et_ 134 +s,_ 132 +tas 132 +s, 132 +_kui 131 +sk 131 +re 130 +po 129 +oli_ 129 +om 129 +äi 128 +inu 128 +_na 128 +_oli_ 128 +_sa 128 +aj 128 +mis 127 +ui_ 127 +_me 127 +_pa 126 +tus 125 +pi 125 +te_ 124 +ül 123 +- 123 +est_ 122 +_on 121 +kk 121 +tt 120 +aga 119 +na_ 119 +_T 119 +T 119 +b_ 118 +al_ 118 +sta 118 +_mu 116 +_ju 116 +ida 116 +aks 116 +gu_ 116 +_ni 116 +s. 116 +ad_ 116 +_pe 114 +eks 114 +ev 114 +end 113 +s._ 113 +use 111 +ära 111 +_po 111 +_min 110 +S 110 +aja 110 +_la 110 +ele 109 +el_ 108 +on_ 108 +ab 108 +_S 108 +av 107 +ing 107 +kui_ 106 +_on_ 106 +au 104 +ne_ 104 +ti_ 104 +ell 103 +ae 101 +kô 101 +ed_ 100 +_ke 99 +ata 99 +iis 99 +! 98 +!_ 98 +sid 98 +nda 98 +eh 98 +lle_ 97 +pu 97 +ää 97 +vôi 97 +ine 96 +t, 96 +e,_ 96 +ale 96 +_vôi 96 +t,_ 96 +e, 96 +eda 96 +uk 95 +ast_ 95 +ld 95 +? 94 +_kui_ 94 +_sel 93 +_kô 93 +tul 93 +ega 93 +lg 92 +sii 92 +val 92 +e. 92 +_su 92 +ug 92 +oh 92 +kü 92 +d. 91 +ee_ 91 +see 91 +e._ 91 +öö 91 +oma 91 +_ole 90 +ses 90 +stu 90 +ôt 90 +üü 90 +_om 89 +me_ 89 +ot 89 +d._ 89 +_sii 88 +to 88 +_en 87 +atu 87 +?_ 87 +A 86 +J 86 +pea 86 +jä 85 +_A 85 +_see 85 +ime 84 +_pi 84 +_ha 84 +mô 84 +nä 84 +_J 84 +les 84 +ste 84 +kas 84 +_ä 84 +vä 83 +E 83 +pä 83 +_ve 83 +_E 83 +eis 82 +_jä 81 +_pea 81 +_mô 80 +um 80 +_kü 80 +iku 80 +üd 80 +all 79 +eid 79 +ba 79 +_vä 79 +ina 78 +lj 78 +sid_ 78 +hu 78 +tun 78 +lä 78 +_oma 77 +i,_ 77 +i, 77 +agu 77 +uh 77 +lm 76 +ras 76 +ss 76 +kä 76 +ees 76 |