diff options
Diffstat (limited to 'libtextcat/data/new_fingerprints/lm/croatian.lm')
-rw-r--r-- | libtextcat/data/new_fingerprints/lm/croatian.lm | 400 |
1 files changed, 400 insertions, 0 deletions
diff --git a/libtextcat/data/new_fingerprints/lm/croatian.lm b/libtextcat/data/new_fingerprints/lm/croatian.lm new file mode 100644 index 000000000000..b054ac34ab89 --- /dev/null +++ b/libtextcat/data/new_fingerprints/lm/croatian.lm @@ -0,0 +1,400 @@ +_ 36598 +a 9456 +o 9050 +i 8526 +e 7955 +n 5513 +j 5379 +s 4971 +t 4125 +r 3889 +u 3423 +je 3281 +l 3231 +e_ 3177 +d 3128 +k 2992 +v 2891 +a_ 2835 +o_ 2679 +m 2645 +p 2316 +_s 2212 +i_ 2205 +y 2174 +c 1894 +z 1867 +je_ 1613 +_n 1593 +g 1581 +_p 1490 +b 1386 +u_ 1382 +, 1208 +,_ 1208 +st 1203 +_j 1202 +na 1159 +_je 1118 +_d 1105 +_i 1104 +. 1069 +._ 1058 +ra 1017 +ko 981 +ni 980 +_je_ 918 +ij 914 +ti 911 +no 891 +da 884 +to 879 +_k 863 +_o 856 +cy 839 +li 838 +ne 790 +sy 786 +- 785 +pr 760 +_u 748 +po 734 +ta 711 +_b 705 +_t 704 +la 699 +ja 699 +an 691 +m_ 680 +ov 674 +ije 673 +_z 669 +ka 662 +ri 652 +lo 651 +vo 643 +re 641 +is 626 +in 623 +se 623 +va 622 +_m 617 +oj 614 +_po 594 +_pr 592 +bi 588 +en 582 +il 578 +os 576 +vi 572 +nj 569 +ak 564 +_na 558 +im 558 +da_ 553 +od 550 +ao 550 +al 549 +om 545 +na_ 533 +_se 524 +_i_ 523 +h 517 +_g 511 +ma 508 +at 502 +cj 501 +og 497 +-- 493 +ro 493 +on 485 +av 480 +_da 474 +_ne 474 +ed 472 +zy 471 +se_ 466 +_se_ 458 +_bi 457 +ao_ 452 +ad 452 +lj 445 +es 444 +ji 441 +_v 433 +_c 430 +za 421 +go 418 +_r 413 +_u_ 411 +yi 410 +ek 406 +di 403 +sa 396 +et 393 +ic 391 +io 390 +_da_ 389 +to_ 389 +as 386 +_ko 383 +ye 378 +ar 378 +mo 373 +le 367 +or 364 +ju 363 +el 354 +tr 354 +io_ 352 +ve 345 +lo_ 344 +su 344 +ol 344 +am 344 +iz 343 +li_ 338 +ti_ 336 +sto 323 +n_ 321 +it 319 +_za 319 +sta 317 +_ni 316 +te 312 +nu 312 +a, 309 +a,_ 309 +ya 309 +do 304 +om_ 303 +la_ 300 +no_ 299 +_na_ 299 +d_ 297 +ko_ 296 +aj 294 +ik 292 +ru 291 +ga 291 +em 288 +nje 283 +dj 281 +ne_ 281 +k_ 277 +_st 276 +koj 276 +ec 274 +_ka 272 +_su 270 +ob 265 +-_ 263 +az 261 +sv 260 +_koj 260 +im_ 260 +ije_ 259 +pa 258 +ot 257 +yt 256 +ok 255 +su_ 255 +ih 254 +me 253 +dn 253 +_cy 253 +iv 251 +syt 248 +g_ 247 +--_ 246 +_- 246 +kr 246 +--- 246 +a. 245 +e,_ 245 +---_ 245 +e, 245 +er 245 +a._ 244 +_iz 244 +mi 243 +_---_ 242 +cyi 242 +_-- 242 +_--- 242 +jed 240 +h_ 239 +_a 239 +_sa 237 +j_ 236 +_l 231 +_sv 229 +_to 229 +sk 228 +ih_ 224 +ja_ 223 +pro 223 +yn 222 +t_ 222 +ost 221 +_do 221 +oc 219 +gl 218 +_su_ 216 +og_ 216 +uc 214 +s_ 214 +bil 213 +oz 213 +ki 212 +ni_ 212 +nij 209 +ako 208 +eg 208 +ut 205 +pre 205 +ci 204 +ji_ 203 +_od 203 +ilo 202 +ati 202 +ac 201 +ns 200 +_mo 197 +rij 196 +bo 195 +ovo 195 +ku 195 +dje 194 +ma_ 192 +_bil 191 +cje 186 +sti 186 +_go 186 +de 185 +sl 183 +_pro 182 +ju_ 182 +nije 181 +tv 180 +lje 179 +isy 179 +pri 178 +_pre 177 +dr 177 +e._ 177 +e. 177 +op 176 +ima 176 +anj 175 +jen 175 +us 172 +ilo_ 172 +_ra 170 +S 167 +ecj 166 +iti 166 +sp 163 +_S 161 +vr 161 +i. 161 +i._ 161 +zn 161 +ali 161 +i,_ 160 +i, 160 +ap 157 +nije_ 157 +nst 156 +pi 156 +ga_ 156 +_sy 155 +_nj 155 +jes 155 +ran 155 +vo_ 155 +yto 154 +ev 153 +_to_ 152 +_pri 151 +est 150 +N 150 +ins 150 +ist 149 +ir 149 +o, 148 +vj 148 +vje 148 +o,_ 148 +B 148 +zi 147 +jec 147 +gov 147 +yto_ 147 +syto 146 +ton 146 +od_ 145 +O 144 +rije 144 +lik 143 +on_ 142 +ocy 142 +W 142 +ba 142 +_W 141 +kao 141 +Wi 141 +_N 141 +inst 141 +_nij 141 +_nije 140 +_Wi 140 +syto_ 140 +lic 139 +P 139 +ovi 138 +_tr 138 +rs 137 +ez 137 +edn 136 +_P 136 +si 136 +ili 136 +du 136 +Winst 135 +cye 135 +nston 135 +ston 135 +ud 135 +kao_ 135 +Wins 135 +insto 135 +oji 135 +nsto 135 +Win 135 +raz 135 +zye 135 +_Win 134 +ova 134 +_Wins 134 +_on 133 +ako_ 133 +odi 133 +cya 133 +ila 133 +icy 133 +oj_ 133 +ke 133 +va_ 132 +ija 132 +_is 132 +jel 132 +oje 130 +pu 130 +cje_ 130 +bi_ 129 +rat 128 +ce 128 +tu 128 +mu 128 +ve_ 127 |