diff options
Diffstat (limited to 'libtextcat/data/new_fingerprints/lm/romanian.lm')
-rw-r--r-- | libtextcat/data/new_fingerprints/lm/romanian.lm | 400 |
1 files changed, 400 insertions, 0 deletions
diff --git a/libtextcat/data/new_fingerprints/lm/romanian.lm b/libtextcat/data/new_fingerprints/lm/romanian.lm new file mode 100644 index 000000000000..65b8e7554d8e --- /dev/null +++ b/libtextcat/data/new_fingerprints/lm/romanian.lm @@ -0,0 +1,400 @@ +_ 20674 +a 6376 +e 5815 +i 5746 +t 3396 +r 3280 +n 3103 +u 2835 +s 2611 +c 2582 +e_ 2235 +l 2224 +o 2149 +a_ 1974 +d 1629 +m 1528 +p 1410 +i_ 1358 +in 1308 +_c 1167 +_s 1118 +_d 999 +re 905 +ar 898 +, 791 +,_ 786 +_p 785 +de 771 +_a 754 +te 687 +_i 667 +at 654 +ti 645 +ca 639 +n_ 630 +ta 617 +si 614 +_de 609 +f 606 +st 583 +ri 581 +u_ 567 +nt 553 +. 542 +ra 540 +_m 534 +g 528 +v 516 +ul 516 +de_ 513 +_in 503 +b 492 +_de_ 474 +._ 472 +le 459 +l_ 444 +un 443 +_si 440 +es 437 +tr 426 +ea 420 +t_ 412 +ce 412 +ma 407 +cu 402 +er 398 +_ca 397 +si_ 388 +_f 387 +_l 383 +z 382 +la 381 +ne 370 +sa 364 +as 360 +_e 357 +in_ 356 +an 352 +it 351 +te_ 346 +or 345 +el 345 +ci 339 +_si_ 333 +_n 330 +are 324 +pe 319 +re_ 317 +al 310 +_t 309 +se 304 +ic 295 +ie 290 +_u 290 +ul_ 290 +ni 289 +int 285 +_o 280 +en 279 +ta_ 279 +ur 261 +pa 256 +co 255 +_pe 254 +ia 252 +mi 251 +pr 249 +_ma 249 +oa 249 +me 246 +lu 246 +li 241 +im 238 +_in_ 237 +da 237 +na 237 +_sa 235 +ac 234 +- 234 +ii 232 +est 231 +r_ 231 +h 230 +_cu 230 +le_ 229 +ai 229 +ca_ 227 +il 226 +ru 223 +sc 223 +_v 221 +nu 220 +tu 220 +_un 220 +nd 220 +di 219 +are_ 216 +to 215 +am 214 +on 213 +o_ 208 +is 208 +sa_ 203 +la_ 200 +_b 200 +ste 195 +et 194 +ec 191 +_r 186 +car 185 +ui 180 +un_ 179 +lo 178 +cu_ 177 +ei 176 +e, 175 +e,_ 175 +pe_ 171 +m_ 167 +_la 166 +a, 165 +a,_ 164 +_ce 164 +rt 163 +_co 163 +ent 162 +ro 162 +ele 162 +_pe_ 160 +po 160 +ea_ 159 +" 158 +ntr 158 +_cu_ 158 +_pr 157 +ut 157 +nc 156 +ata 155 +care 154 +um 153 +au 151 +va 151 +_o_ 150 +_car 150 +ii_ 145 +ind 145 +_un_ 144 +os 144 +ad 141 +_la_ 140 +I 140 +este 138 +ste_ 138 +care_ 138 +ir 137 +ga 136 +ap 136 +ol 136 +ra_ 136 +_di 134 +D 134 +_care 133 +se_ 133 +om 133 +ara 133 +ati 133 +fi 133 +_sa_ 131 +zi 130 +vi 130 +_ca_ 129 +_se 128 +_nu 128 +ai_ 127 +ch 127 +pi 124 +ve 123 +fa 122 +ot 121 +_a_ 120 +este_ 120 +du 119 +ine 119 +s_ 118 +fo 118 +_ci 118 +ui_ 118 +ba 118 +i, 117 +i,_ 116 +ne_ 115 +us 115 +_g 115 +a. 115 +fe 114 +A 114 +pu 114 +ce_ 113 +ar_ 113 +_pa 113 +oc 112 +sta 112 +lui 112 +ns 112 +em 112 +' 112 +oar 112 +din 111 +iu 111 +_int 111 +ate 111 +mu 111 +hi 110 +ele_ 110 +mp 109 +_D 109 +S 109 +sti 108 +bi 108 +ata_ 107 +ti_ 107 +tra 107 +C 107 +c_ 106 +tre 106 +_al 105 +rea 105 +mai 105 +j 104 +a._ 104 +gi 104 +e. 103 +d_ 103 +_fa 103 +E 102 +mo 102 +at_ 101 +_e_ 101 +nte 101 +lt 101 +sp 101 +za 100 +mai_ 100 +su 99 +na_ 98 +tat 97 +sin 97 +ez 96 +tru 96 +e._ 96 +ie_ 96 +ia_ 96 +_re 96 +tul 96 +_fo 96 +ina 95 +art 95 +_C 95 +no 95 +nu_ 94 +_es 94 +_po 94 +cr 94 +inc 93 +_da 92 +_mai 92 +lui_ 92 +_din 92 +_est 92 +pre 91 +_mai_ 91 +io 91 +chi 91 +ge 90 +pri 90 +eu 90 +uri 90 +az 90 +_nu_ 89 +_me 89 +ct 89 +au_ 88 +esc 88 +ev 88 +ei_ 88 +min 87 +ace 87 +op 86 +ng 86 +ici 86 +_lu 85 +ari 85 +_mi 84 +ita 84 +_S 84 +_tr 84 +ere 83 +or_ 83 +ast 83 +ist 83 +nt_ 83 +_se_ 82 +ou 82 +tin 82 +intr 82 +con 82 +do 81 +_fi 81 +str 81 +am_ 80 +rat 80 +ru_ 80 +ri_ 80 +par 80 +oi 80 +uc 79 +ze 79 +pl 79 +res 78 +_ac 77 +ulu 77 +din_ 76 +va_ 76 +ada 76 +ului 75 +_con 75 +id 75 +inte 74 +ile 73 +cit 73 +_din_ 73 +lor 73 +_" 72 +ig 72 +rin 72 +da_ 72 +_st 72 +-_ 71 +_- 71 +it_ 71 +ani 71 +nd_ 71 +ci_ 70 +ag 70 +eri 70 +i. 70 +tru_ 70 +_ne 70 +rm 70 +P 69 +_este 69 +nta 69 +bu 69 +une 69 +ma_ 69 +nti 69 +imp 68 +_-_ 68 +iv 68 +ind_ 68 |